Minor
[framework/uifw/harfbuzz.git] / src / hb-icu.cc
1 /*
2  * Copyright © 2009  Red Hat, Inc.
3  * Copyright © 2009  Keith Stribley
4  * Copyright © 2011  Google, Inc.
5  *
6  *  This is part of HarfBuzz, a text shaping library.
7  *
8  * Permission is hereby granted, without written agreement and without
9  * license or royalty fees, to use, copy, modify, and distribute this
10  * software and its documentation for any purpose, provided that the
11  * above copyright notice and the following two paragraphs appear in
12  * all copies of this software.
13  *
14  * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
15  * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
16  * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
17  * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
18  * DAMAGE.
19  *
20  * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
21  * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
22  * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
23  * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
24  * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
25  *
26  * Red Hat Author(s): Behdad Esfahbod
27  * Google Author(s): Behdad Esfahbod
28  */
29
30 #include "hb-private.hh"
31
32 #include "hb-icu.h"
33
34 #include "hb-unicode-private.hh"
35
36 #include <unicode/uversion.h>
37 #include <unicode/uchar.h>
38
39 HB_BEGIN_DECLS
40
41
42 hb_script_t
43 hb_icu_script_to_script (UScriptCode script)
44 {
45   if (unlikely (script == USCRIPT_INVALID_CODE))
46     return HB_SCRIPT_INVALID;
47
48   return hb_script_from_string (uscript_getShortName (script));
49 }
50
51 UScriptCode
52 hb_icu_script_from_script (hb_script_t script)
53 {
54   if (unlikely (script == HB_SCRIPT_INVALID))
55     return USCRIPT_INVALID_CODE;
56
57   for (unsigned int i = 0; i < USCRIPT_CODE_LIMIT; i++)
58     if (unlikely (hb_icu_script_to_script ((UScriptCode) i) == script))
59       return (UScriptCode) i;
60
61   return USCRIPT_UNKNOWN;
62 }
63
64
65 static unsigned int
66 hb_icu_get_combining_class (hb_unicode_funcs_t *ufuncs HB_UNUSED,
67                             hb_codepoint_t      unicode,
68                             void               *user_data HB_UNUSED)
69
70 {
71   return u_getCombiningClass (unicode);
72 }
73
74 static unsigned int
75 hb_icu_get_eastasian_width (hb_unicode_funcs_t *ufuncs HB_UNUSED,
76                             hb_codepoint_t      unicode,
77                             void               *user_data HB_UNUSED)
78 {
79   switch (u_getIntPropertyValue(unicode, UCHAR_EAST_ASIAN_WIDTH))
80   {
81   case U_EA_WIDE:
82   case U_EA_FULLWIDTH:
83     return 2;
84   case U_EA_NEUTRAL:
85   case U_EA_AMBIGUOUS:
86   case U_EA_HALFWIDTH:
87   case U_EA_NARROW:
88     return 1;
89   }
90   return 1;
91 }
92
93 static hb_unicode_general_category_t
94 hb_icu_get_general_category (hb_unicode_funcs_t *ufuncs HB_UNUSED,
95                              hb_codepoint_t      unicode,
96                              void               *user_data HB_UNUSED)
97 {
98   switch (u_getIntPropertyValue(unicode, UCHAR_GENERAL_CATEGORY))
99   {
100   case U_UNASSIGNED:                    return HB_UNICODE_GENERAL_CATEGORY_UNASSIGNED;
101
102   case U_UPPERCASE_LETTER:              return HB_UNICODE_GENERAL_CATEGORY_UPPERCASE_LETTER;
103   case U_LOWERCASE_LETTER:              return HB_UNICODE_GENERAL_CATEGORY_LOWERCASE_LETTER;
104   case U_TITLECASE_LETTER:              return HB_UNICODE_GENERAL_CATEGORY_TITLECASE_LETTER;
105   case U_MODIFIER_LETTER:               return HB_UNICODE_GENERAL_CATEGORY_MODIFIER_LETTER;
106   case U_OTHER_LETTER:                  return HB_UNICODE_GENERAL_CATEGORY_OTHER_LETTER;
107
108   case U_NON_SPACING_MARK:              return HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK;
109   case U_ENCLOSING_MARK:                return HB_UNICODE_GENERAL_CATEGORY_ENCLOSING_MARK;
110   case U_COMBINING_SPACING_MARK:        return HB_UNICODE_GENERAL_CATEGORY_COMBINING_MARK;
111
112   case U_DECIMAL_DIGIT_NUMBER:          return HB_UNICODE_GENERAL_CATEGORY_DECIMAL_NUMBER;
113   case U_LETTER_NUMBER:                 return HB_UNICODE_GENERAL_CATEGORY_LETTER_NUMBER;
114   case U_OTHER_NUMBER:                  return HB_UNICODE_GENERAL_CATEGORY_OTHER_NUMBER;
115
116   case U_SPACE_SEPARATOR:               return HB_UNICODE_GENERAL_CATEGORY_SPACE_SEPARATOR;
117   case U_LINE_SEPARATOR:                return HB_UNICODE_GENERAL_CATEGORY_LINE_SEPARATOR;
118   case U_PARAGRAPH_SEPARATOR:           return HB_UNICODE_GENERAL_CATEGORY_PARAGRAPH_SEPARATOR;
119
120   case U_CONTROL_CHAR:                  return HB_UNICODE_GENERAL_CATEGORY_CONTROL;
121   case U_FORMAT_CHAR:                   return HB_UNICODE_GENERAL_CATEGORY_FORMAT;
122   case U_PRIVATE_USE_CHAR:              return HB_UNICODE_GENERAL_CATEGORY_PRIVATE_USE;
123   case U_SURROGATE:                     return HB_UNICODE_GENERAL_CATEGORY_SURROGATE;
124
125
126   case U_DASH_PUNCTUATION:              return HB_UNICODE_GENERAL_CATEGORY_DASH_PUNCTUATION;
127   case U_START_PUNCTUATION:             return HB_UNICODE_GENERAL_CATEGORY_OPEN_PUNCTUATION;
128   case U_END_PUNCTUATION:               return HB_UNICODE_GENERAL_CATEGORY_CLOSE_PUNCTUATION;
129   case U_CONNECTOR_PUNCTUATION:         return HB_UNICODE_GENERAL_CATEGORY_CONNECT_PUNCTUATION;
130   case U_OTHER_PUNCTUATION:             return HB_UNICODE_GENERAL_CATEGORY_OTHER_PUNCTUATION;
131
132   case U_MATH_SYMBOL:                   return HB_UNICODE_GENERAL_CATEGORY_MATH_SYMBOL;
133   case U_CURRENCY_SYMBOL:               return HB_UNICODE_GENERAL_CATEGORY_CURRENCY_SYMBOL;
134   case U_MODIFIER_SYMBOL:               return HB_UNICODE_GENERAL_CATEGORY_MODIFIER_SYMBOL;
135   case U_OTHER_SYMBOL:                  return HB_UNICODE_GENERAL_CATEGORY_OTHER_SYMBOL;
136
137   case U_INITIAL_PUNCTUATION:           return HB_UNICODE_GENERAL_CATEGORY_INITIAL_PUNCTUATION;
138   case U_FINAL_PUNCTUATION:             return HB_UNICODE_GENERAL_CATEGORY_FINAL_PUNCTUATION;
139   }
140
141   return HB_UNICODE_GENERAL_CATEGORY_UNASSIGNED;
142 }
143
144 static hb_codepoint_t
145 hb_icu_get_mirroring (hb_unicode_funcs_t *ufuncs HB_UNUSED,
146                       hb_codepoint_t      unicode,
147                       void               *user_data HB_UNUSED)
148 {
149   return u_charMirror(unicode);
150 }
151
152 static hb_script_t
153 hb_icu_get_script (hb_unicode_funcs_t *ufuncs HB_UNUSED,
154                    hb_codepoint_t      unicode,
155                    void               *user_data HB_UNUSED)
156 {
157   UErrorCode status = U_ZERO_ERROR;
158   UScriptCode scriptCode = uscript_getScript(unicode, &status);
159
160   if (unlikely (status != U_ZERO_ERROR))
161     return HB_SCRIPT_UNKNOWN;
162
163   return hb_icu_script_to_script (scriptCode);
164 }
165
166 extern HB_INTERNAL hb_unicode_funcs_t _hb_unicode_funcs_icu;
167 hb_unicode_funcs_t _hb_icu_unicode_funcs = {
168   HB_OBJECT_HEADER_STATIC,
169
170   NULL, /* parent */
171   TRUE, /* immutable */
172   {
173     hb_icu_get_combining_class,
174     hb_icu_get_eastasian_width,
175     hb_icu_get_general_category,
176     hb_icu_get_mirroring,
177     hb_icu_get_script
178   }
179 };
180
181 hb_unicode_funcs_t *
182 hb_icu_get_unicode_funcs (void)
183 {
184   return &_hb_icu_unicode_funcs;
185 }
186
187
188 HB_END_DECLS