1 /* shmbutil.h -- utility functions for multibyte characters. */
3 /* Copyright (C) 2002-2004 Free Software Foundation, Inc.
5 This file is part of GNU Bash, the Bourne Again SHell.
7 Bash is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
12 Bash is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
17 You should have received a copy of the GNU General Public License along
18 with Bash; see the file COPYING. If not, write to the Free Software
19 Foundation, 59 Temple Place, Suite 330, Boston, MA 02111 USA. */
21 #if !defined (_SH_MBUTIL_H_)
26 /* Include config.h for HANDLE_MULTIBYTE */
/* Multibyte support switch.  When HANDLE_MULTIBYTE is defined this group
   declares the multibyte helper functions and defines predicates on
   conversion results; otherwise it supplies single-byte stand-ins with the
   same names. */
29 #if defined (HANDLE_MULTIBYTE)
/* Prototypes only -- the definitions live outside this header.  __P wraps
   the parameter lists; its definition is not visible in this excerpt
   (NOTE(review): presumably from "stdc.h" -- confirm). */
31 extern size_t xmbsrtowcs __P((wchar_t *, const char **, size_t, mbstate_t *));
32 extern size_t xdupmbstowcs __P((wchar_t **, char ***, const char *));
34 extern size_t mbstrlen __P((const char *));
36 extern char *xstrchr __P((const char *, int));
/* True when X is (size_t)-1 or (size_t)-2, the two values the macros in
   this file treat as a failed mbrlen() result. */
39 #define MB_INVALIDCH(x) ((x) == (size_t)-1 || (x) == (size_t)-2)
/* True when X is 0. */
40 #define MB_NULLWCH(x) ((x) == 0)
/* Length of S via mbstrlen(), with shortcuts: 0 for a null pointer or an
   empty string, 1 when the second byte is NUL.  S is evaluated more than
   once. */
43 #define MBSLEN(s) (((s) && (s)[0]) ? ((s)[1] ? mbstrlen (s) : 1) : 0)
/* Uses MBSLEN when MB_CUR_MAX > 1, otherwise STRLEN.  STRLEN is not
   defined in this header. */
44 #define MB_STRLEN(s) ((MB_CUR_MAX > 1) ? MBSLEN (s) : STRLEN (s))
46 #else /* !HANDLE_MULTIBYTE */
/* Single-byte fallbacks: xstrchr is plain strchr, the result predicates
   are constant 0, and MB_STRLEN is STRLEN. */
55 #define xstrchr(s, c) strchr(s, c)
58 #define MB_INVALIDCH(x) (0)
59 #define MB_NULLWCH(x) (0)
62 #define MB_STRLEN(s) (STRLEN(s))
64 #endif /* !HANDLE_MULTIBYTE */
/* Declare and initialize a multibyte state.  Call must be terminated
   with `;'.

   With HANDLE_MULTIBYTE the expansion declares a variable named `state'
   of type mbstate_t and clears it with memset().  Because it begins with
   a declaration, use it where a declaration is allowed.  Without
   HANDLE_MULTIBYTE it expands to nothing. */
#if defined (HANDLE_MULTIBYTE)
#  define DECLARE_MBSTATE \
        mbstate_t state; \
        memset (&state, '\0', sizeof (mbstate_t))
#else
#  define DECLARE_MBSTATE
#endif /* !HANDLE_MULTIBYTE */
/* Initialize or reinitialize a multibyte state named `state'.  Call must be
   terminated with `;'.

   With HANDLE_MULTIBYTE the expansion clears an already-declared `state'
   with memset(); without it the macro expands to nothing. */
#if defined (HANDLE_MULTIBYTE)
#  define INITIALIZE_MBSTATE memset (&state, '\0', sizeof (mbstate_t))
#else
#  define INITIALIZE_MBSTATE
#endif /* !HANDLE_MULTIBYTE */
/* Advance one (possibly multi-byte) character in string _STR of length
   _STRSIZE, starting at index _I.  STATE must have already been declared.

   _I must be a modifiable lvalue and is evaluated more than once.  When
   MB_CUR_MAX > 1 the character at _STR + _I is measured with mbrlen():
   an invalid or incomplete sequence restores STATE and steps over one
   byte, a NUL steps over one byte, and any other result steps over the
   whole character.  Otherwise _I is simply incremented.  The multibyte
   form is a statement; terminate the call with `;'. */
#if defined (HANDLE_MULTIBYTE)
#  define ADVANCE_CHAR(_str, _strsize, _i) \
    do \
      { \
        if (MB_CUR_MAX > 1) \
          { \
            mbstate_t state_bak; \
            size_t mblength; \
\
            state_bak = state; \
            mblength = mbrlen ((_str) + (_i), (_strsize) - (_i), &state); \
\
            if (mblength == (size_t)-2 || mblength == (size_t)-1) \
              { \
                state = state_bak; /* undo the failed conversion */ \
                (_i)++; \
              } \
            else if (mblength == 0) \
              (_i)++; \
            else \
              (_i) += mblength; \
          } \
        else \
          (_i)++; \
      } \
    while (0)
#else
#  define ADVANCE_CHAR(_str, _strsize, _i) (_i)++
#endif /* !HANDLE_MULTIBYTE */
/* Advance one (possibly multibyte) character in the string _STR of length
   _STRSIZE.  STATE must have already been declared.
   SPECIAL:  assume that _STR will be incremented by 1 after this call.

   Because the caller adds the final increment, the multibyte path moves
   _STR by one less than the character length: a character of N bytes
   advances _STR by N - 1, and a NUL (length 0) leaves _STR alone.  An
   invalid or incomplete sequence restores STATE and leaves _STR alone.
   Without HANDLE_MULTIBYTE the macro expands to nothing. */
#if defined (HANDLE_MULTIBYTE)
#  define ADVANCE_CHAR_P(_str, _strsize) \
    do \
      { \
        if (MB_CUR_MAX > 1) \
          { \
            mbstate_t state_bak; \
            size_t mblength; \
\
            state_bak = state; \
            mblength = mbrlen ((_str), (_strsize), &state); \
\
            if (mblength == (size_t)-2 || mblength == (size_t)-1) \
              { \
                state = state_bak; /* undo the failed conversion */ \
                mblength = 1; \
              } \
            else \
              (_str) += (mblength < 1) ? 0 : (mblength - 1); \
          } \
      } \
    while (0)
#else
#  define ADVANCE_CHAR_P(_str, _strsize)
#endif /* !HANDLE_MULTIBYTE */
/* Back up one (possibly multi-byte) character in string _STR of length
   _STRSIZE, starting at index _I.  STATE must have already been declared.

   _I must be a modifiable lvalue and is evaluated more than once.  When
   MB_CUR_MAX > 1 the string is rescanned from index 0 with mbrlen(),
   remembering where the last successfully measured character before _I
   began; _I is set to that index.  Invalid or incomplete sequences
   (after restoring STATE) and NULs are stepped over one byte at a time and
   do not become the remembered start.  Otherwise _I is simply
   decremented. */
#if defined (HANDLE_MULTIBYTE)
#  define BACKUP_CHAR(_str, _strsize, _i) \
    do \
      { \
        if (MB_CUR_MAX > 1) \
          { \
            mbstate_t state_bak; \
            size_t mblength; \
            int _x, _p; /* _x == temp index into string, _p == prev index */ \
\
            _x = _p = 0; \
            while (_x < (_i)) \
              { \
                state_bak = state; \
                mblength = mbrlen ((_str) + (_x), (_strsize) - (_x), &state); \
\
                if (mblength == (size_t)-2 || mblength == (size_t)-1) \
                  { \
                    state = state_bak; \
                    _x++; \
                  } \
                else if (mblength == 0) \
                  _x++; \
                else \
                  { \
                    _p = _x; /* _p == start of prev mbchar */ \
                    _x += (int) mblength; \
                  } \
              } \
            (_i) = _p; \
          } \
        else \
          (_i)--; \
      } \
    while (0)
#else
#  define BACKUP_CHAR(_str, _strsize, _i) (_i)--
#endif /* !HANDLE_MULTIBYTE */
/* Back up one (possibly multibyte) character in the string _BASE of length
   _STRSIZE starting at _STR (_BASE <= _STR <= (_BASE + _STRSIZE) ).
   SPECIAL: DO NOT assume that _STR will be decremented by 1 after this call.

   _STR must be a modifiable pointer lvalue.  When MB_CUR_MAX > 1 the
   string is rescanned from _BASE with mbrlen(), remembering where the last
   successfully measured character before _STR began; _STR is set to that
   position.  Invalid or incomplete sequences (after restoring STATE) and
   NULs are stepped over one byte at a time.  Otherwise _STR is simply
   decremented.

   Both scan variables are pointers, and the length handed to mbrlen() is
   the number of bytes left after _x, i.e. _STRSIZE minus the offset of _x
   from _BASE. */
#if defined (HANDLE_MULTIBYTE)
#  define BACKUP_CHAR_P(_base, _strsize, _str) \
    do \
      { \
        if (MB_CUR_MAX > 1) \
          { \
            mbstate_t state_bak; \
            size_t mblength; \
            char *_x, *_p; /* _x == temp pointer into string, _p == prev pointer */ \
\
            _x = _p = (char *)(_base); \
            while (_x < (_str)) \
              { \
                state_bak = state; \
                mblength = mbrlen (_x, (_strsize) - (_x - (char *)(_base)), &state); \
\
                if (mblength == (size_t)-2 || mblength == (size_t)-1) \
                  { \
                    state = state_bak; \
                    _x++; \
                  } \
                else if (mblength == 0) \
                  _x++; \
                else \
                  { \
                    _p = _x; /* _p == start of prev mbchar */ \
                    _x += mblength; \
                  } \
              } \
            (_str) = _p; \
          } \
        else \
          (_str)--; \
      } \
    while (0)
#else
#  define BACKUP_CHAR_P(_base, _strsize, _str) (_str)--
#endif /* !HANDLE_MULTIBYTE */
/* Copy a single character from the string _SRC to the string _DST.
   _SRCEND is a pointer to the end of _SRC.

   _DST and _SRC must be modifiable pointer lvalues; both are advanced past
   the bytes copied.  When MB_CUR_MAX > 1 the character length comes from
   mbrlen() over the bytes up to _SRCEND; an invalid or incomplete sequence
   (after restoring STATE) and a NUL are each copied as a single byte.
   Otherwise exactly one byte is copied.  STATE must have already been
   declared. */
#if defined (HANDLE_MULTIBYTE)
#  define COPY_CHAR_P(_dst, _src, _srcend) \
    do \
      { \
        if (MB_CUR_MAX > 1) \
          { \
            mbstate_t state_bak; \
            size_t mblength; \
            size_t _k; \
\
            state_bak = state; \
            mblength = mbrlen ((_src), (_srcend) - (_src), &state); \
            if (mblength == (size_t)-2 || mblength == (size_t)-1) \
              { \
                state = state_bak; \
                mblength = 1; \
              } \
            else \
              mblength = (mblength < 1) ? 1 : mblength; \
\
            for (_k = 0; _k < mblength; _k++) \
              *(_dst)++ = *(_src)++; \
          } \
        else \
          *(_dst)++ = *(_src)++; \
      } \
    while (0)
#else
#  define COPY_CHAR_P(_dst, _src, _srcend) *(_dst)++ = *(_src)++
#endif /* !HANDLE_MULTIBYTE */
/* Copy a single character from the string _SRC at index _SI to the string
   _DST at index _DI.  _SRCEND is a pointer to the end of _SRC.

   _DI and _SI must be modifiable lvalues; both are advanced past the bytes
   copied.  When MB_CUR_MAX > 1 the character length comes from mbrlen()
   over the bytes from _SRC + _SI up to _SRCEND; an invalid or incomplete
   sequence (after restoring STATE) and a NUL are each copied as a single
   byte.  Otherwise exactly one byte is copied.  STATE must have already
   been declared.  Every argument is parenthesized in the expansion so
   that expression arguments group as intended. */
#if defined (HANDLE_MULTIBYTE)
#  define COPY_CHAR_I(_dst, _di, _src, _srcend, _si) \
    do \
      { \
        if (MB_CUR_MAX > 1) \
          { \
            mbstate_t state_bak; \
            size_t mblength; \
            size_t _k; \
\
            state_bak = state; \
            mblength = mbrlen ((_src) + (_si), (_srcend) - ((_src) + (_si)), &state); \
            if (mblength == (size_t)-2 || mblength == (size_t)-1) \
              { \
                state = state_bak; \
                mblength = 1; \
              } \
            else \
              mblength = (mblength < 1) ? 1 : mblength; \
\
            for (_k = 0; _k < mblength; _k++) \
              (_dst)[(_di)++] = (_src)[(_si)++]; \
          } \
        else \
          (_dst)[(_di)++] = (_src)[(_si)++]; \
      } \
    while (0)
#else
#  define COPY_CHAR_I(_dst, _di, _src, _srcend, _si) (_dst)[(_di)++] = (_src)[(_si)++]
#endif /* !HANDLE_MULTIBYTE */
294 /****************************************************************
296 * The following are only guaranteed to work in subst.c *
298 ****************************************************************/
/* SCOPY_CHAR_I: produce the escape character _ESCCHAR followed by the
   (possibly multibyte) character at _SRC[_SI].

   Multibyte path (MB_CUR_MAX > 1): the character is measured with mbrlen()
   over the remaining _SLEN - _SI bytes and the length is clamped to at
   least 1.  A buffer of mblength + 2 bytes is obtained from xmalloc() into
   `temp', filled with _ESCCHAR, then mblength bytes taken from _SRC while
   advancing _SI, then a terminating NUL.
   The visible single-byte lines store _ESCCHAR in _dst[0].

   The expansion uses `temp', `_i', `mblength' and `state' without
   declaring them in the lines visible here, and _SC does not appear in
   the visible lines.
   NOTE(review): some of these are presumably locals of the calling
   function in subst.c -- confirm against the caller. */
300 #if defined (HANDLE_MULTIBYTE)
301 # define SCOPY_CHAR_I(_dst, _escchar, _sc, _src, _si, _slen) \
304 if (MB_CUR_MAX > 1) \
306 mbstate_t state_bak; \
311 mblength = mbrlen ((_src) + (_si), (_slen) - (_si), &state); \
312 if (mblength == (size_t)-2 || mblength == (size_t)-1) \
318 mblength = (mblength < 1) ? 1 : mblength; \
320 temp = xmalloc (mblength + 2); /* escape byte + character + NUL */ \
321 temp[0] = _escchar; \
322 for (_i = 0; _i < mblength; _i++) \
323 temp[_i + 1] = _src[_si++]; \
324 temp[mblength + 1] = '\0'; \
330 _dst[0] = _escchar; \
336 # define SCOPY_CHAR_I(_dst, _escchar, _sc, _src, _si, _slen) \
337 _dst[0] = _escchar; \
339 #endif /* !HANDLE_MULTIBYTE */
/* SCOPY_CHAR_M: copy the (possibly multibyte) character at _SRC[_SI] to
   the position _DST points at, advancing _DST.  _SRCEND is the pointer
   used to bound the mbrlen() call.

   Multibyte path (MB_CUR_MAX > 1): the character is measured with mbrlen()
   over the bytes from _SRC + _SI up to _SRCEND, the length is clamped to
   at least 1, that many bytes are copied with FASTCOPY (source first,
   destination second) and _DST is advanced by the same amount.
   The visible single-byte lines store _src[_si] through _DST and
   post-increment _DST.

   `state' and `mblength' are not declared in the lines visible here, and
   FASTCOPY is not defined in this header.  No visible line changes _SI.
   NOTE(review): whether a line not shown here advances _SI is unknown --
   confirm. */
341 #if defined (HANDLE_MULTIBYTE)
342 # define SCOPY_CHAR_M(_dst, _src, _srcend, _si) \
345 if (MB_CUR_MAX > 1) \
347 mbstate_t state_bak; \
351 mblength = mbrlen ((_src) + (_si), (_srcend) - ((_src) + (_si)), &state); \
352 if (mblength == (size_t)-2 || mblength == (size_t)-1) \
358 mblength = (mblength < 1) ? 1 : mblength; \
360 FASTCOPY(((_src) + (_si)), (_dst), mblength); \
362 (_dst) += mblength; \
367 *(_dst)++ = _src[(_si)]; \
373 # define SCOPY_CHAR_M(_dst, _src, _srcend, _si) \
374 *(_dst)++ = _src[(_si)]; \
376 #endif /* !HANDLE_MULTIBYTE */
/* SADD_MBCHAR: when MB_CUR_MAX > 1, extract the multibyte character at
   _SRC[_SI] into a freshly allocated string.

   The character is measured with mbrlen() over the remaining
   _SRCSIZE - _SI bytes.  _DST is assigned an xmalloc()ed buffer of
   mblength + 1 bytes, which receives mblength bytes taken from _SRC while
   advancing _SI, followed by a terminating NUL.  The second definition
   visible below has an empty expansion.

   The expansion uses `i', `mblength' and `state' without declaring them in
   the lines visible here.
   NOTE(review): what happens after an invalid mbrlen() result, and who
   frees _DST, are not visible in this excerpt -- confirm. */
379 # define SADD_MBCHAR(_dst, _src, _si, _srcsize) \
382 if (MB_CUR_MAX > 1) \
385 mbstate_t state_bak; \
389 mblength = mbrlen ((_src) + (_si), (_srcsize) - (_si), &state); \
390 if (mblength == (size_t)-1 || mblength == (size_t)-2) \
398 _dst = (char *)xmalloc (mblength + 1); /* character + NUL */ \
399 for (i = 0; i < mblength; i++) \
400 (_dst)[i] = (_src)[(_si)++]; \
401 (_dst)[mblength] = '\0'; \
409 # define SADD_MBCHAR(_dst, _src, _si, _srcsize)
412 /* Watch out when using this -- it's just straight textual substitution */
/* SADD_MBQCHAR_BODY: build a quoted copy of the multibyte character at
   _SRC[_SI].

   The character is measured with mbrlen() over the remaining
   _SRCSIZE - _SI bytes.  _DST is assigned an xmalloc()ed buffer of
   mblength + 2 bytes holding CTLESC, then mblength bytes taken from _SRC
   while advancing _SI, then a terminating NUL.

   The expansion uses `i', `mblength' and `state' without declaring them in
   the lines visible here, and CTLESC is not defined in this header.  No
   MB_CUR_MAX test appears in the visible lines.
   NOTE(review): presumably the caller performs that test -- confirm. */
413 #if defined (HANDLE_MULTIBYTE)
414 # define SADD_MBQCHAR_BODY(_dst, _src, _si, _srcsize) \
417 mbstate_t state_bak; \
421 mblength = mbrlen ((_src) + (_si), (_srcsize) - (_si), &state); \
422 if (mblength == (size_t)-1 || mblength == (size_t)-2) \
430 (_dst) = (char *)xmalloc (mblength + 2); /* CTLESC + character + NUL */ \
431 (_dst)[0] = CTLESC; \
432 for (i = 0; i < mblength; i++) \
433 (_dst)[i+1] = (_src)[(_si)++]; \
434 (_dst)[mblength+1] = '\0'; \
438 #endif /* HANDLE_MULTIBYTE */
439 #endif /* _SH_MBUTIL_H_ */