2 * Copyright (C) 2009,2010 Red Hat, Inc.
4 * This is part of HarfBuzz, a text shaping library.
6 * Permission is hereby granted, without written agreement and without
7 * license or royalty fees, to use, copy, modify, and distribute this
8 * software and its documentation for any purpose, provided that the
9 * above copyright notice and the following two paragraphs appear in
10 * all copies of this software.
12 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
13 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
14 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
15 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
18 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
19 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
20 * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
21 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
22 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
24 * Red Hat Author(s): Behdad Esfahbod
27 #include "hb-private.h"
35 hb_tag_from_string (const char *s)
43 for (i = 0; i < 4 && s[i]; i++)
48 return HB_TAG_CHAR4 (tag);
54 struct _hb_language_t {
58 static const char canon_map[256] = {
59 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
60 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
61 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, '-', 0, 0,
62 '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 0, 0, 0, 0, 0, 0,
63 '-', 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o',
64 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', 0, 0, 0, 0, '-',
65 0, 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o',
66 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', 0, 0, 0, 0, 0
70 lang_equal (const void *v1,
73 const unsigned char *p1 = v1;
74 const unsigned char *p2 = v2;
76 while (canon_map[*p1] && canon_map[*p1] == canon_map[*p2])
81 return (canon_map[*p1] == canon_map[*p2]);
86 lang_hash (const void *key)
88 const unsigned char *p = key;
92 h = (h << 5) - h + canon_map[*p];
102 hb_language_from_string (const char *str)
104 static unsigned int num_langs;
105 static unsigned int num_alloced;
106 static hb_language_t *langs;
110 /* TODO Use a hash table or something */
115 for (i = 0; i < num_langs; i++)
116 if (lang_equal (str, langs[i]->s))
119 if (unlikely (num_langs == num_alloced)) {
120 unsigned int new_alloced = 2 * (8 + num_alloced);
121 hb_language_t *new_langs = realloc (langs, new_alloced * sizeof (langs[0]));
124 num_alloced = new_alloced;
128 langs[i] = (hb_language_t) strdup (str);
129 for (p = (unsigned char *) langs[i]->s; *p; p++)
138 hb_language_to_string (hb_language_t language)
147 hb_script_from_iso15924_tag (hb_tag_t tag)
149 /* Be lenient, adjust case (one capital letter followed by three small letters) */
150 tag = (tag & 0xDFDFDFDF) | 0x00202020;
153 case HB_TAG('C','y','r','s'): return HB_SCRIPT_CYRILLIC;
154 case HB_TAG('G','e','o','a'): return HB_SCRIPT_GEORGIAN;
155 case HB_TAG('G','e','o','n'): return HB_SCRIPT_GEORGIAN;
156 case HB_TAG('L','a','t','f'): return HB_SCRIPT_LATIN;
157 case HB_TAG('L','a','t','g'): return HB_SCRIPT_LATIN;
158 case HB_TAG('S','y','r','e'): return HB_SCRIPT_SYRIAC;
159 case HB_TAG('S','y','r','j'): return HB_SCRIPT_SYRIAC;
160 case HB_TAG('S','y','r','n'): return HB_SCRIPT_SYRIAC;
163 /* If it looks right, just use the tag as a script */
164 if (((uint32_t) tag & 0xE0E0E0E0) == 0x40606060)
165 return (hb_script_t) tag;
167 /* Otherwise, return unknown */
168 return HB_SCRIPT_UNKNOWN;
172 hb_script_from_string (const char *s)
174 return hb_script_from_iso15924_tag (hb_tag_from_string (s));
178 hb_script_to_iso15924_tag (hb_script_t script)
180 return (hb_tag_t) script;
184 hb_script_get_horizontal_direction (hb_script_t script)
186 switch ((hb_tag_t) script)
188 case HB_SCRIPT_ARABIC:
189 case HB_SCRIPT_HEBREW:
190 case HB_SCRIPT_SYRIAC:
191 case HB_SCRIPT_THAANA:
193 /* Unicode-4.0 additions */
194 case HB_SCRIPT_CYPRIOT:
196 /* Unicode-5.0 additions */
197 case HB_SCRIPT_PHOENICIAN:
200 /* Unicode-5.2 additions */
201 case HB_SCRIPT_AVESTAN:
202 case HB_SCRIPT_IMPERIAL_ARAMAIC:
203 case HB_SCRIPT_INSCRIPTIONAL_PAHLAVI:
204 case HB_SCRIPT_INSCRIPTIONAL_PARTHIAN:
205 case HB_SCRIPT_OLD_SOUTH_ARABIAN:
206 case HB_SCRIPT_OLD_TURKIC:
207 case HB_SCRIPT_SAMARITAN:
209 /* Unicode-6.0 additions */
210 case HB_SCRIPT_MANDAIC:
212 return HB_DIRECTION_RTL;
215 return HB_DIRECTION_LTR;