Update BIG5-HKSCS charmap to HKSCS-2008
[platform/upstream/glibc.git] / iconvdata / euc-kr.c
1 /* Mapping tables for EUC-KR handling.
2    Copyright (C) 1998-2013 Free Software Foundation, Inc.
3    This file is part of the GNU C Library.
4    Contributed by Jungshik Shin <jshin@pantheon.yale.edu>
5    and Ulrich Drepper <drepper@cygnus.com>, 1998.
6
7    The GNU C Library is free software; you can redistribute it and/or
8    modify it under the terms of the GNU Lesser General Public
9    License as published by the Free Software Foundation; either
10    version 2.1 of the License, or (at your option) any later version.
11
12    The GNU C Library is distributed in the hope that it will be useful,
13    but WITHOUT ANY WARRANTY; without even the implied warranty of
14    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15    Lesser General Public License for more details.
16
17    You should have received a copy of the GNU Lesser General Public
18    License along with the GNU C Library; if not, see
19    <http://www.gnu.org/licenses/>.  */
20
21 #include <dlfcn.h>
22 #include <stdint.h>
23 #include <ksc5601.h>
24
25
26 static inline void
27 __attribute ((always_inline))
28 euckr_from_ucs4 (uint32_t ch, unsigned char *cp)
29 {
30   if (ch > 0x9f)
31     {
32       if (__builtin_expect (ch, 0) == 0x20a9)
33         {
34           /* Half-width Korean Currency WON sign.  There is no
35              equivalent in EUC-KR.  Some mappings use \x5c because
36              this is what some old Korean ASCII variants used but this
37              is causing problems.  We map it to the FULL WIDTH WON SIGN.  */
38           cp[0] = '\xa3';
39           cp[1] = '\xdc';
40         }
41       else if (__builtin_expect (ucs4_to_ksc5601 (ch, cp, 2), 0)
42           != __UNKNOWN_10646_CHAR)
43         {
44           cp[0] |= 0x80;
45           cp[1] |= 0x80;
46         }
47       else
48         cp[0] = cp[1] = '\0';
49     }
50   else
51     {
52       /* There is no mapping for U005c but we nevertheless map it to
53          \x5c.  */
54       cp[0] = (unsigned char) ch;
55       cp[1] = '\0';
56     }
57 }
58
59
60 /* Definitions used in the body of the `gconv' function.  */
61 #define CHARSET_NAME            "EUC-KR//"
62 #define FROM_LOOP               from_euc_kr
63 #define TO_LOOP                 to_euc_kr
64 #define DEFINE_INIT             1
65 #define DEFINE_FINI             1
66 #define MIN_NEEDED_FROM         1
67 #define MAX_NEEDED_FROM         2
68 #define MIN_NEEDED_TO           4
69
70
71 /* First define the conversion function from EUC-KR to UCS4.  */
72 #define MIN_NEEDED_INPUT        MIN_NEEDED_FROM
73 #define MAX_NEEDED_INPUT        MAX_NEEDED_FROM
74 #define MIN_NEEDED_OUTPUT       MIN_NEEDED_TO
75 #define LOOPFCT                 FROM_LOOP
76 #define BODY \
77   {                                                                           \
78     uint32_t ch = *inptr;                                                     \
79                                                                               \
80     if (ch <= 0x9f)                                                           \
81       ++inptr;                                                                \
82     /* 0xfe(->0x7e : row 94) and 0xc9(->0x59 : row 41) are                    \
83        user-defined areas.  */                                                \
84     else if (__builtin_expect (ch == 0xa0, 0)                                 \
85              || __builtin_expect (ch > 0xfe, 0)                               \
86              || __builtin_expect (ch == 0xc9, 0))                             \
87       {                                                                       \
88         /* This is illegal.  */                                               \
89         STANDARD_FROM_LOOP_ERR_HANDLER (1);                                   \
90       }                                                                       \
91     else                                                                      \
92       {                                                                       \
93         /* Two-byte character.  First test whether the next byte              \
94            is also available.  */                                             \
95         ch = ksc5601_to_ucs4 (&inptr, inend - inptr, 0x80);                   \
96         if (__builtin_expect (ch == 0, 0))                                    \
97           {                                                                   \
98             /* The second byte is not available.  */                          \
99             result = __GCONV_INCOMPLETE_INPUT;                                \
100             break;                                                            \
101           }                                                                   \
102         if (__builtin_expect (ch == __UNKNOWN_10646_CHAR, 0))                 \
103           /* This is an illegal character.  */                                \
104           STANDARD_FROM_LOOP_ERR_HANDLER (2);                                 \
105       }                                                                       \
106                                                                               \
107     put32 (outptr, ch);                                                       \
108     outptr += 4;                                                              \
109   }
110 #define LOOP_NEED_FLAGS
111 #define ONEBYTE_BODY \
112   {                                                                           \
113     if (c <= 0x9f)                                                            \
114       return c;                                                               \
115     else                                                                      \
116       return WEOF;                                                            \
117   }
118 #include <iconv/loop.c>
119
120
121 /* Next, define the other direction.  */
122 #define MIN_NEEDED_INPUT        MIN_NEEDED_TO
123 #define MIN_NEEDED_OUTPUT       MIN_NEEDED_FROM
124 #define MAX_NEEDED_OUTPUT       MAX_NEEDED_FROM
125 #define LOOPFCT                 TO_LOOP
126 #define BODY \
127   {                                                                           \
128     uint32_t ch = get32 (inptr);                                              \
129     unsigned char cp[2];                                                      \
130                                                                               \
131     /* Decomposing Hangul syllables not available in KS C 5601 into           \
132        Jamos should be considered either here or in euckr_from_ucs4() */      \
133     euckr_from_ucs4 (ch, cp);                                                 \
134                                                                               \
135     if (__builtin_expect (cp[0], '\1') == '\0' && ch != 0)                    \
136       {                                                                       \
137         UNICODE_TAG_HANDLER (ch, 4);                                          \
138                                                                               \
139         /* Illegal character.  */                                             \
140         STANDARD_TO_LOOP_ERR_HANDLER (4);                                     \
141       }                                                                       \
142                                                                               \
143     *outptr++ = cp[0];                                                        \
144     /* Now test for a possible second byte and write this if possible.  */    \
145     if (cp[1] != '\0')                                                        \
146       {                                                                       \
147         if (__builtin_expect (outptr >= outend, 0))                           \
148           {                                                                   \
149             /* The result does not fit into the buffer.  */                   \
150             --outptr;                                                         \
151             result = __GCONV_FULL_OUTPUT;                                     \
152             break;                                                            \
153           }                                                                   \
154         *outptr++ = cp[1];                                                    \
155       }                                                                       \
156                                                                               \
157     inptr += 4;                                                               \
158   }
159 #define LOOP_NEED_FLAGS
160 #include <iconv/loop.c>
161
162
163 /* Now define the toplevel functions.  */
164 #include <iconv/skeleton.c>