[glib] Add two-way script conversion functions
[profile/ivi/org.tizen.video-player.git] / src / hb-glib.cc
1 /*
2  * Copyright (C) 2009  Red Hat, Inc.
3  *
4  *  This is part of HarfBuzz, a text shaping library.
5  *
6  * Permission is hereby granted, without written agreement and without
7  * license or royalty fees, to use, copy, modify, and distribute this
8  * software and its documentation for any purpose, provided that the
9  * above copyright notice and the following two paragraphs appear in
10  * all copies of this software.
11  *
12  * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
13  * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
14  * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
15  * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
16  * DAMAGE.
17  *
18  * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
19  * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
20  * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
21  * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
22  * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
23  *
24  * Red Hat Author(s): Behdad Esfahbod
25  */
26
27 #include "hb-private.h"
28
29 #include "hb-glib.h"
30
31 #include "hb-unicode-private.hh"
32
33 #include <glib.h>
34
35 HB_BEGIN_DECLS
36
37 static const hb_script_t
38 glib_script_to_script[] =
39 {
40   HB_SCRIPT_COMMON,
41   HB_SCRIPT_INHERITED,
42   HB_SCRIPT_ARABIC,
43   HB_SCRIPT_ARMENIAN,
44   HB_SCRIPT_BENGALI,
45   HB_SCRIPT_BOPOMOFO,
46   HB_SCRIPT_CHEROKEE,
47   HB_SCRIPT_COPTIC,
48   HB_SCRIPT_CYRILLIC,
49   HB_SCRIPT_DESERET,
50   HB_SCRIPT_DEVANAGARI,
51   HB_SCRIPT_ETHIOPIC,
52   HB_SCRIPT_GEORGIAN,
53   HB_SCRIPT_GOTHIC,
54   HB_SCRIPT_GREEK,
55   HB_SCRIPT_GUJARATI,
56   HB_SCRIPT_GURMUKHI,
57   HB_SCRIPT_HAN,
58   HB_SCRIPT_HANGUL,
59   HB_SCRIPT_HEBREW,
60   HB_SCRIPT_HIRAGANA,
61   HB_SCRIPT_KANNADA,
62   HB_SCRIPT_KATAKANA,
63   HB_SCRIPT_KHMER,
64   HB_SCRIPT_LAO,
65   HB_SCRIPT_LATIN,
66   HB_SCRIPT_MALAYALAM,
67   HB_SCRIPT_MONGOLIAN,
68   HB_SCRIPT_MYANMAR,
69   HB_SCRIPT_OGHAM,
70   HB_SCRIPT_OLD_ITALIC,
71   HB_SCRIPT_ORIYA,
72   HB_SCRIPT_RUNIC,
73   HB_SCRIPT_SINHALA,
74   HB_SCRIPT_SYRIAC,
75   HB_SCRIPT_TAMIL,
76   HB_SCRIPT_TELUGU,
77   HB_SCRIPT_THAANA,
78   HB_SCRIPT_THAI,
79   HB_SCRIPT_TIBETAN,
80   HB_SCRIPT_CANADIAN_ABORIGINAL,
81   HB_SCRIPT_YI,
82   HB_SCRIPT_TAGALOG,
83   HB_SCRIPT_HANUNOO,
84   HB_SCRIPT_BUHID,
85   HB_SCRIPT_TAGBANWA,
86
87   /* Unicode-4.0 additions */
88   HB_SCRIPT_BRAILLE,
89   HB_SCRIPT_CYPRIOT,
90   HB_SCRIPT_LIMBU,
91   HB_SCRIPT_OSMANYA,
92   HB_SCRIPT_SHAVIAN,
93   HB_SCRIPT_LINEAR_B,
94   HB_SCRIPT_TAI_LE,
95   HB_SCRIPT_UGARITIC,
96
97   /* Unicode-4.1 additions */
98   HB_SCRIPT_NEW_TAI_LUE,
99   HB_SCRIPT_BUGINESE,
100   HB_SCRIPT_GLAGOLITIC,
101   HB_SCRIPT_TIFINAGH,
102   HB_SCRIPT_SYLOTI_NAGRI,
103   HB_SCRIPT_OLD_PERSIAN,
104   HB_SCRIPT_KHAROSHTHI,
105
106   /* Unicode-5.0 additions */
107   HB_SCRIPT_UNKNOWN,
108   HB_SCRIPT_BALINESE,
109   HB_SCRIPT_CUNEIFORM,
110   HB_SCRIPT_PHOENICIAN,
111   HB_SCRIPT_PHAGS_PA,
112   HB_SCRIPT_NKO,
113
114   /* Unicode-5.1 additions */
115   HB_SCRIPT_KAYAH_LI,
116   HB_SCRIPT_LEPCHA,
117   HB_SCRIPT_REJANG,
118   HB_SCRIPT_SUNDANESE,
119   HB_SCRIPT_SAURASHTRA,
120   HB_SCRIPT_CHAM,
121   HB_SCRIPT_OL_CHIKI,
122   HB_SCRIPT_VAI,
123   HB_SCRIPT_CARIAN,
124   HB_SCRIPT_LYCIAN,
125   HB_SCRIPT_LYDIAN,
126
127   /* Unicode-5.2 additions */
128   HB_SCRIPT_AVESTAN,
129   HB_SCRIPT_BAMUM,
130   HB_SCRIPT_EGYPTIAN_HIEROGLYPHS,
131   HB_SCRIPT_IMPERIAL_ARAMAIC,
132   HB_SCRIPT_INSCRIPTIONAL_PAHLAVI,
133   HB_SCRIPT_INSCRIPTIONAL_PARTHIAN,
134   HB_SCRIPT_JAVANESE,
135   HB_SCRIPT_KAITHI,
136   HB_SCRIPT_TAI_THAM,
137   HB_SCRIPT_LISU,
138   HB_SCRIPT_MEETEI_MAYEK,
139   HB_SCRIPT_OLD_SOUTH_ARABIAN,
140   HB_SCRIPT_OLD_TURKIC,
141   HB_SCRIPT_SAMARITAN,
142   HB_SCRIPT_TAI_VIET,
143
144   /* Unicode-6.0 additions */
145   HB_SCRIPT_BATAK,
146   HB_SCRIPT_BRAHMI,
147   HB_SCRIPT_MANDAIC
148 };
149
150 hb_script_t
151 hb_glib_script_to_script (GUnicodeScript script)
152 {
153   if (likely ((unsigned int) script < ARRAY_LENGTH (glib_script_to_script)))
154     return glib_script_to_script[script];
155
156   if (unlikely (script == G_UNICODE_SCRIPT_INVALID_CODE))
157     return HB_SCRIPT_INVALID;
158
159   return HB_SCRIPT_UNKNOWN;
160 }
161
162 GUnicodeScript
163 hb_glib_script_from_script (hb_script_t script)
164 {
165   unsigned int count = ARRAY_LENGTH (glib_script_to_script);
166   for (unsigned int i = 0; i < count; i++)
167     if (glib_script_to_script[i] == script)
168       return (GUnicodeScript) i;
169
170   if (unlikely (script == HB_SCRIPT_INVALID))
171     return G_UNICODE_SCRIPT_INVALID_CODE;
172
173   return G_UNICODE_SCRIPT_UNKNOWN;
174 }
175
176
177 static unsigned int
178 hb_glib_get_combining_class (hb_unicode_funcs_t *ufuncs,
179                              hb_codepoint_t      unicode,
180                              void               *user_data)
181
182 {
183   return g_unichar_combining_class (unicode);
184 }
185
186 static unsigned int
187 hb_glib_get_eastasian_width (hb_unicode_funcs_t *ufuncs,
188                              hb_codepoint_t      unicode,
189                              void               *user_data)
190 {
191   return g_unichar_iswide (unicode) ? 2 : 1;
192 }
193
194 static hb_unicode_general_category_t
195 hb_glib_get_general_category (hb_unicode_funcs_t *ufuncs,
196                               hb_codepoint_t      unicode,
197                               void               *user_data)
198
199 {
200   /* hb_unicode_general_category_t and GUnicodeType are identical */
201   return (hb_unicode_general_category_t) g_unichar_type (unicode);
202 }
203
204 static hb_codepoint_t
205 hb_glib_get_mirroring (hb_unicode_funcs_t *ufuncs,
206                        hb_codepoint_t      unicode,
207                        void               *user_data)
208 {
209   g_unichar_get_mirror_char (unicode, &unicode);
210   return unicode;
211 }
212
213 static hb_script_t
214 hb_glib_get_script (hb_unicode_funcs_t *ufuncs,
215                     hb_codepoint_t      unicode,
216                     void               *user_data)
217 {
218   return hb_glib_script_to_script (g_unichar_get_script (unicode));
219 }
220
221 static hb_unicode_funcs_t glib_ufuncs = {
222   HB_REFERENCE_COUNT_INVALID, /* ref_count */
223   NULL, /* parent */
224   TRUE, /* immutable */
225   {
226     hb_glib_get_combining_class,
227     hb_glib_get_eastasian_width,
228     hb_glib_get_general_category,
229     hb_glib_get_mirroring,
230     hb_glib_get_script
231   }
232 };
233
234 hb_unicode_funcs_t *
235 hb_glib_get_unicode_funcs (void)
236 {
237   return &glib_ufuncs;
238 }
239
240
241 HB_END_DECLS