1 /* -*- mode: C; c-file-style: "gnu" -*- */
2 /* dbus-string.c String utility class (internal to D-BUS implementation)
4 * Copyright (C) 2002, 2003 Red Hat, Inc.
6 * Licensed under the Academic Free License version 1.2
8 * This program is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation; either version 2 of the License, or
11 * (at your option) any later version.
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
18 * You should have received a copy of the GNU General Public License
19 * along with this program; if not, write to the Free Software
20 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
24 #include "dbus-internals.h"
25 #include "dbus-string.h"
26 /* we allow a system header here, for speed/convenience */
28 #include "dbus-marshal.h"
29 #define DBUS_CAN_USE_DBUS_STRING_PRIVATE 1
30 #include "dbus-string-private.h"
33 * @defgroup DBusString string class
34 * @ingroup DBusInternals
35 * @brief DBusString data structure
37 * Types and functions related to DBusString. DBusString is intended
38 * to be a string class that makes it hard to mess up security issues
39 * (and just in general harder to write buggy code). It should be
40 * used (or extended and then used) rather than the libc stuff in
41 * string.h. The string class is a bit inconvenient at spots because
42 * it handles out-of-memory failures and tries to be extra-robust.
44 * A DBusString has a maximum length set at initialization time; this
45 * can be used to ensure that a buffer doesn't get too big. The
46 * _dbus_string_lengthen() method checks for overflow, and for max
47 * length being exceeded.
49 * Try to avoid conversion to a plain C string, i.e. add methods on
50 * the string object instead, only convert to C string when passing
51 * things out to the public API. In particular, no sprintf, strcpy,
52 * strcat, any of that should be used. The GString feature of
53 * accepting negative numbers for "length of string" is also absent,
54 * because it could keep us from detecting bogus huge lengths. i.e. if
55 * we passed in some bogus huge length it would be taken to mean
56 * "current length of string" instead of "broken crack"
60 * @defgroup DBusStringInternals DBusString implementation details
61 * @ingroup DBusInternals
62 * @brief DBusString implementation details
64 * The guts of DBusString.
70 * We allocate 1 byte for nul termination, plus 7 bytes for possible
71 * align_offset, so we always need 8 bytes on top of the string's
72 * length to be in the allocated block.
74 #define ALLOCATION_PADDING 8
77 * This is the maximum max length (and thus also the maximum length) of a DBusString.
80 #define MAX_MAX_LENGTH (_DBUS_INT_MAX - ALLOCATION_PADDING)
83 * Checks a bunch of assertions about a string object
85 * @param real the DBusRealString
87 #define DBUS_GENERIC_STRING_PREAMBLE(real) _dbus_assert ((real) != NULL); _dbus_assert (!(real)->invalid); _dbus_assert ((real)->len >= 0); _dbus_assert ((real)->allocated >= 0); _dbus_assert ((real)->max_length >= 0); _dbus_assert ((real)->len <= ((real)->allocated - ALLOCATION_PADDING)); _dbus_assert ((real)->len <= (real)->max_length)
90 * Checks assertions about a string object that needs to be
91 * modifiable - may not be locked or const. Also declares
92 * the "real" variable pointing to DBusRealString.
93 * @param str the string
95 #define DBUS_STRING_PREAMBLE(str) DBusRealString *real = (DBusRealString*) str; \
96 DBUS_GENERIC_STRING_PREAMBLE (real); \
97 _dbus_assert (!(real)->constant); \
98 _dbus_assert (!(real)->locked)
101 * Checks assertions about a string object that may be locked but
102 * can't be const. i.e. a string object that we can free. Also
103 * declares the "real" variable pointing to DBusRealString.
105 * @param str the string
107 #define DBUS_LOCKED_STRING_PREAMBLE(str) DBusRealString *real = (DBusRealString*) str; \
108 DBUS_GENERIC_STRING_PREAMBLE (real); \
109 _dbus_assert (!(real)->constant)
112 * Checks assertions about a string that may be const or locked. Also
113 * declares the "real" variable pointing to DBusRealString.
114 * @param str the string.
116 #define DBUS_CONST_STRING_PREAMBLE(str) const DBusRealString *real = (DBusRealString*) str; \
117 DBUS_GENERIC_STRING_PREAMBLE (real)
122 * @addtogroup DBusString
/* Re-establishes 8-byte alignment of the string data inside its allocation.
 *
 * The true start of the allocated block is real->str minus the offset that
 * was applied last time. That start is rounded to an 8-byte boundary, the
 * distance moved becomes the new align_offset, and if the offset changed the
 * existing bytes are slid to the new position with memmove().
 * Visible callers invoke this after the block may have moved (after
 * dbus_realloc) and right after the initial dbus_malloc.
 *
 * NOTE(review): the statement that re-points real->str at the aligned
 * address is not present in this listing; the final assertion below shows
 * that real->str is expected to be aligned on exit.
 *
 * @param real the string whose data pointer should be re-aligned
 */
127 fixup_alignment (DBusRealString *real)
131 unsigned int old_align_offset;
133 /* we have to have extra space in real->allocated for the align offset and nul byte */
134 _dbus_assert (real->len <= real->allocated - ALLOCATION_PADDING);
/* recover the real start of the block from the previously applied offset */
136 old_align_offset = real->align_offset;
137 real_block = real->str - old_align_offset;
/* align the block start to 8 bytes; the distance moved is the new offset */
139 aligned = _DBUS_ALIGN_ADDRESS (real_block, 8);
141 real->align_offset = aligned - real_block;
144 if (old_align_offset != real->align_offset)
146 /* Here comes the suck: the offset changed, so the data has to be moved to the new aligned position */
147 memmove (real_block + real->align_offset,
148 real_block + old_align_offset,
/* postconditions: the offset fits in the 7 padding bytes and str is 8-byte aligned */
152 _dbus_assert (real->align_offset < 8);
153 _dbus_assert (_DBUS_ALIGN_ADDRESS (real->str, 8) == real->str);
/* Reverses fixup_alignment(): moves the string data back to the very start
 * of the allocated block and clears align_offset, so that real->str is once
 * again the address of the block itself (the address that dbus_free() is
 * given in _dbus_string_free()). _dbus_string_steal_data() calls this
 * before handing the buffer to the caller.
 *
 * @param real the string whose alignment offset should be removed
 */
157 undo_alignment (DBusRealString *real)
/* nothing to move when the data already starts at the block start */
159 if (real->align_offset != 0)
161 memmove (real->str - real->align_offset,
165 real->str = real->str - real->align_offset;
166 real->align_offset = 0;
171 * Initializes a string. The maximum length may be _DBUS_INT_MAX for
172 * no maximum. The string starts life with zero length.
173 * The string must eventually be freed with _dbus_string_free().
175 * @todo the max length feature is useless, because it looks to the
176 * app like out of memory, and the app might try to "recover" - but
177 * recovery in this case is impossible, as we can't ever "get more
178 * memory" - so should delete the max length feature I think. Well, at
179 * least there's a strong caveat that it can only be used when
180 * out-of-memory is a permanent fatal error.
182 * @todo we could make this init routine not alloc any memory and
183 * return void, would simplify a lot of code, however it might
184 * complexify things elsewhere because _dbus_string_get_data()
185 * etc. could suddenly fail as they'd need to alloc new memory.
187 * @param str memory to hold the string
188 * @param max_length the maximum size of the string
189 * @returns #TRUE on success */
191 _dbus_string_init (DBusString *str,
194 DBusRealString *real;
196 _dbus_assert (str != NULL);
197 _dbus_assert (max_length >= 0);
199 _dbus_assert (sizeof (DBusString) == sizeof (DBusRealString));
201 real = (DBusRealString*) str;
203 /* It's very important not to touch anything
204 * other than real->str if we're going to fail,
205 * since we also use this function to reset
206 * an existing string, e.g. in _dbus_string_steal_data()
209 real->str = dbus_malloc (ALLOCATION_PADDING);
210 if (real->str == NULL)
213 real->allocated = ALLOCATION_PADDING;
215 real->str[real->len] = '\0';
217 real->max_length = max_length;
218 if (real->max_length > MAX_MAX_LENGTH)
219 real->max_length = MAX_MAX_LENGTH;
220 real->constant = FALSE;
221 real->locked = FALSE;
222 real->invalid = FALSE;
223 real->align_offset = 0;
225 fixup_alignment (real);
231 * Initializes a constant string. The value parameter is not copied
232 * (should be static), and the string may never be modified.
233 * It is safe but not necessary to call _dbus_string_free()
234 * on a const string. The string has a length limit of MAXINT - 8.
236 * @param str memory to use for the string
237 * @param value a string to be stored in str (not copied!!!)
240 _dbus_string_init_const (DBusString *str,
243 _dbus_assert (value != NULL);
245 _dbus_string_init_const_len (str, value,
250 * Initializes a constant string with a length. The value parameter is
251 * not copied (should be static), and the string may never be
252 * modified. It is safe but not necessary to call _dbus_string_free() on a const string.
255 * @param str memory to use for the string
256 * @param value a string to be stored in str (not copied!!!)
257 * @param len the length to use
260 _dbus_string_init_const_len (DBusString *str,
264 DBusRealString *real;
266 _dbus_assert (str != NULL);
267 _dbus_assert (value != NULL);
268 _dbus_assert (len <= MAX_MAX_LENGTH);
269 _dbus_assert (len >= 0);
271 real = (DBusRealString*) str;
273 real->str = (char*) value;
275 real->allocated = real->len + ALLOCATION_PADDING; /* a lie, just to avoid special-case assertions... */
276 real->max_length = real->len + 1;
277 real->constant = TRUE;
278 real->invalid = FALSE;
280 /* We don't require const strings to be 8-byte aligned as the
281 * memory is coming from elsewhere.
286 * Frees a string created by _dbus_string_init().
288 * @param str memory where the string is stored.
291 _dbus_string_free (DBusString *str)
293 DBusRealString *real = (DBusRealString*) str;
294 DBUS_GENERIC_STRING_PREAMBLE (real);
298 dbus_free (real->str - real->align_offset);
300 real->invalid = TRUE;
304 * Locks a string such that any attempts to change the string will
305 * result in aborting the program. Also, if the string is wasting a
306 * lot of memory (allocation is sufficiently larger than what the
307 * string is really using), _dbus_string_lock() will realloc the
308 * string's data to "compact" it.
310 * @param str the string to lock.
313 _dbus_string_lock (DBusString *str)
315 DBUS_LOCKED_STRING_PREAMBLE (str); /* can lock multiple times */
319 /* Try to realloc to avoid excess memory usage, since
320 * we know we won't change the string further
323 if (real->allocated - MAX_WASTE > real->len)
328 new_allocated = real->len + ALLOCATION_PADDING;
330 new_str = dbus_realloc (real->str - real->align_offset,
334 real->str = new_str + real->align_offset;
335 real->allocated = new_allocated;
336 fixup_alignment (real);
/* Sets the length of the string to new_length, growing the allocation
 * when the new length (plus ALLOCATION_PADDING for the nul byte and the
 * alignment slack) no longer fits. Fails when new_length exceeds the
 * string's max_length; a failed reallocation is presumably reported the
 * same way (the failure returns are not present in this listing).
 * On success the string is nul-terminated at the new length. Bytes added
 * by growing are not initialized here.
 *
 * @param real the string to resize
 * @param new_length the new length, not counting the nul terminator
 */
342 set_length (DBusRealString *real,
345 /* Note, new_length does not include the nul terminator; room for it comes from ALLOCATION_PADDING */
347 /* exceeding max length is the same as failure to allocate memory */
348 if (new_length > real->max_length)
351 if (new_length > (real->allocated - ALLOCATION_PADDING))
356 /* at least double our old allocation so that repeated growth does not realloc on every call, while avoiding int overflow */
359 if (real->allocated > (MAX_MAX_LENGTH + ALLOCATION_PADDING) / 2)
360 new_allocated = MAX_MAX_LENGTH + ALLOCATION_PADDING;
362 new_allocated = real->allocated * 2;
364 /* But be sure we always alloc at least space for the new length */
/* Compare against the doubled size computed above, not the old allocation:
 * inside this branch new_length + ALLOCATION_PADDING is always larger than
 * real->allocated, so using real->allocated here would throw the doubling
 * away and grow the buffer by exactly what is needed each time.
 */
365 new_allocated = MAX (new_allocated, new_length + ALLOCATION_PADDING);
367 new_str = dbus_realloc (real->str - real->align_offset, new_allocated);
/* keep the old offset for the moment; fixup_alignment() recomputes it for the (possibly moved) block */
371 real->str = new_str + real->align_offset;
372 real->allocated = new_allocated;
373 fixup_alignment (real);
376 real->len = new_length;
377 real->str[real->len] = '\0';
/* Tail of the gap-opening helper that other functions in this file call as
 * open_gap (len, dest, insert_at); its first signature line is not present
 * in this listing.
 *
 * Lengthens dest by len bytes and shifts everything from insert_at onward
 * up by len, leaving a hole of len bytes at insert_at for the caller to
 * fill. Returns FALSE when growing by len would exceed dest->max_length;
 * a set_length() failure is presumably reported the same way (that return
 * is not visible here).
 */
384 DBusRealString *dest,
/* written as a subtraction so that dest->len + len is never computed if it could overflow */
390 if (len > dest->max_length - dest->len)
391 return FALSE; /* detected overflow of dest->len + len below */
393 if (!set_length (dest, dest->len + len))
/* dest->len already includes len at this point, so the old tail that has to move is dest->len - len - insert_at bytes long */
396 memmove (dest->str + insert_at + len,
397 dest->str + insert_at,
398 dest->len - len - insert_at);
404 * Gets the raw character buffer from the string. The returned buffer
405 * will be nul-terminated, but note that strings may contain binary
406 * data so there may be extra nul characters prior to the termination.
407 * This function should be little-used, extend DBusString or add
408 * stuff to dbus-sysdeps.c instead. It's an error to use this
409 * function on a const string.
411 * @param str the string
412 * @param data_return place to store the returned data
415 _dbus_string_get_data (DBusString *str,
418 DBUS_STRING_PREAMBLE (str);
419 _dbus_assert (data_return != NULL);
421 *data_return = real->str;
425 * Gets the raw character buffer from a const string.
427 * @todo should return the const char* instead of using an out param;
428 * the temporary variable encourages a bug where you use const data
429 * after modifying the string and possibly causing a realloc.
431 * @param str the string
432 * @param data_return location to store returned data
435 _dbus_string_get_const_data (const DBusString *str,
436 const char **data_return)
438 DBUS_CONST_STRING_PREAMBLE (str);
439 _dbus_assert (data_return != NULL);
441 *data_return = real->str;
445 * Gets a sub-portion of the raw character buffer from the
446 * string. The "len" field is required simply for error
447 * checking, to be sure you don't try to use more
448 * string than exists. The nul termination of the
449 * returned buffer remains at the end of the entire
450 * string, not at start + len.
452 * @param str the string
453 * @param data_return location to return the buffer
454 * @param start byte offset to return
455 * @param len length of segment to return
458 _dbus_string_get_data_len (DBusString *str,
463 DBUS_STRING_PREAMBLE (str);
464 _dbus_assert (data_return != NULL);
465 _dbus_assert (start >= 0);
466 _dbus_assert (len >= 0);
467 _dbus_assert (start <= real->len);
468 _dbus_assert (len <= real->len - start);
470 *data_return = real->str + start;
474 * const version of _dbus_string_get_data_len().
476 * @todo should return the const char* instead of using an out param;
477 * the temporary variable encourages a bug where you use const data
478 * after modifying the string and possibly causing a realloc.
480 * @param str the string
481 * @param data_return location to return the buffer
482 * @param start byte offset to return
483 * @param len length of segment to return
486 _dbus_string_get_const_data_len (const DBusString *str,
487 const char **data_return,
491 DBUS_CONST_STRING_PREAMBLE (str);
492 _dbus_assert (data_return != NULL);
493 _dbus_assert (start >= 0);
494 _dbus_assert (len >= 0);
495 _dbus_assert (start <= real->len);
496 _dbus_assert (len <= real->len - start);
498 *data_return = real->str + start;
502 * Sets the value of the byte at the given position.
504 * @param str the string
505 * @param i the position
506 * @param byte the new value
509 _dbus_string_set_byte (DBusString *str,
513 DBUS_STRING_PREAMBLE (str);
514 _dbus_assert (i < real->len);
515 _dbus_assert (i >= 0);
521 * Gets the byte at the given position.
523 * @param str the string
524 * @param start the position
525 * @returns the byte at that position
528 _dbus_string_get_byte (const DBusString *str,
531 DBUS_CONST_STRING_PREAMBLE (str);
532 _dbus_assert (start < real->len);
533 _dbus_assert (start >= 0);
535 return real->str[start];
539 * Inserts the given byte at the given position.
541 * @param str the string
542 * @param i the position
543 * @param byte the value to insert
544 * @returns #TRUE on success
547 _dbus_string_insert_byte (DBusString *str,
551 DBUS_STRING_PREAMBLE (str);
552 _dbus_assert (i <= real->len);
553 _dbus_assert (i >= 0);
555 if (!open_gap (1, real, i))
564 * Like _dbus_string_get_data(), but removes the
565 * gotten data from the original string. The caller
566 * must free the data returned. This function may
567 * fail due to lack of memory, and return #FALSE.
569 * @param str the string
570 * @param data_return location to return the buffer
571 * @returns #TRUE on success
574 _dbus_string_steal_data (DBusString *str,
577 DBUS_STRING_PREAMBLE (str);
578 _dbus_assert (data_return != NULL);
/* move the data to the start of the allocation so the pointer handed out is the block itself, which the caller will free */
580 undo_alignment (real);
582 *data_return = real->str;
584 /* reset the string: _dbus_string_init() gives str a fresh buffer, leaving the old one owned by the caller */
585 if (!_dbus_string_init (str, real->max_length))
587 /* hrm, put it back then: a failed init has touched nothing but real->str, so restoring it and re-aligning recovers the string */
588 real->str = *data_return;
590 fixup_alignment (real);
598 * Like _dbus_string_get_data_len(), but removes the gotten data from
599 * the original string. The caller must free the data returned. This
600 * function may fail due to lack of memory, and return #FALSE.
601 * The returned string is nul-terminated and has length len.
603 * @todo this function is broken because on failure it
604 * may corrupt the source string.
606 * @param str the string
607 * @param data_return location to return the buffer
608 * @param start the start of segment to steal
609 * @param len the length of segment to steal
610 * @returns #TRUE on success
613 _dbus_string_steal_data_len (DBusString *str,
620 DBUS_STRING_PREAMBLE (str);
621 _dbus_assert (data_return != NULL);
622 _dbus_assert (start >= 0);
623 _dbus_assert (len >= 0);
624 _dbus_assert (start <= real->len);
625 _dbus_assert (len <= real->len - start);
627 if (!_dbus_string_init (&dest, real->max_length))
630 if (!_dbus_string_move_len (str, start, len, &dest, 0))
632 _dbus_string_free (&dest);
636 _dbus_warn ("Broken code in _dbus_string_steal_data_len(), see @todo, FIXME\n");
637 if (!_dbus_string_steal_data (&dest, data_return))
639 _dbus_string_free (&dest);
643 _dbus_string_free (&dest);
649 * Copies the data from the string into a char*
651 * @param str the string
652 * @param data_return place to return the data
653 * @returns #TRUE on success, #FALSE on no memory
656 _dbus_string_copy_data (const DBusString *str,
659 DBUS_CONST_STRING_PREAMBLE (str);
660 _dbus_assert (data_return != NULL);
662 *data_return = dbus_malloc (real->len + 1);
663 if (*data_return == NULL)
666 memcpy (*data_return, real->str, real->len + 1);
672 * Copies a segment of the string into a char*
674 * @param str the string
675 * @param data_return place to return the data
676 * @param start start index
677 * @param len length to copy
678 * @returns #FALSE if no memory
681 _dbus_string_copy_data_len (const DBusString *str,
688 DBUS_CONST_STRING_PREAMBLE (str);
689 _dbus_assert (data_return != NULL);
690 _dbus_assert (start >= 0);
691 _dbus_assert (len >= 0);
692 _dbus_assert (start <= real->len);
693 _dbus_assert (len <= real->len - start);
695 if (!_dbus_string_init (&dest, real->max_length))
698 if (!_dbus_string_copy_len (str, start, len, &dest, 0))
700 _dbus_string_free (&dest);
704 if (!_dbus_string_steal_data (&dest, data_return))
706 _dbus_string_free (&dest);
710 _dbus_string_free (&dest);
715 * Gets the length of a string (not including nul termination).
717 * @returns the length.
720 _dbus_string_get_length (const DBusString *str)
722 DBUS_CONST_STRING_PREAMBLE (str);
728 * Makes a string longer by the given number of bytes. Checks whether
729 * adding additional_length to the current length would overflow an
730 * integer, and checks for exceeding a string's max length.
731 * The new bytes are not initialized, other than nul-terminating
732 * the end of the string. The uninitialized bytes may contain
733 * nul bytes or other junk.
735 * @param str a string
736 * @param additional_length length to add to the string.
737 * @returns #TRUE on success.
740 _dbus_string_lengthen (DBusString *str,
741 int additional_length)
743 DBUS_STRING_PREAMBLE (str);
744 _dbus_assert (additional_length >= 0);
746 if (additional_length > real->max_length - real->len)
747 return FALSE; /* would overflow */
749 return set_length (real,
750 real->len + additional_length);
754 * Makes a string shorter by the given number of bytes.
756 * @param str a string
757 * @param length_to_remove length to remove from the string.
760 _dbus_string_shorten (DBusString *str,
761 int length_to_remove)
763 DBUS_STRING_PREAMBLE (str);
764 _dbus_assert (length_to_remove >= 0);
765 _dbus_assert (length_to_remove <= real->len);
768 real->len - length_to_remove);
772 * Sets the length of a string. Can be used to truncate or lengthen
773 * the string. If the string is lengthened, the function may fail and
774 * return #FALSE. Newly-added bytes are not initialized, as with
775 * _dbus_string_lengthen().
777 * @param str a string
778 * @param length new length of the string.
779 * @returns #FALSE on failure.
782 _dbus_string_set_length (DBusString *str,
785 DBUS_STRING_PREAMBLE (str);
786 _dbus_assert (length >= 0);
788 return set_length (real, length);
792 * Align the length of a string to a specific alignment (typically 4 or 8)
793 * by appending nul bytes to the string.
795 * @param str a string
796 * @param alignment the alignment
797 * @returns #FALSE if no memory
800 _dbus_string_align_length (DBusString *str,
803 unsigned long new_len; /* ulong to avoid _DBUS_ALIGN_VALUE overflow */
805 DBUS_STRING_PREAMBLE (str);
806 _dbus_assert (alignment >= 1);
807 _dbus_assert (alignment <= 8); /* it has to be a bug if > 8 */
/* target length: the current length aligned to the requested boundary */
809 new_len = _DBUS_ALIGN_VALUE (real->len, alignment);
/* refuse before converting back to int if the aligned length would exceed the string's limit */
810 if (new_len > (unsigned long) real->max_length)
/* delta is the number of padding bytes that will be appended */
813 delta = new_len - real->len;
814 _dbus_assert (delta >= 0);
819 if (!set_length (real, new_len))
/* the padding occupies the last delta bytes of the lengthened string, starting at new_len - delta */
822 memset (real->str + (new_len - delta),
/* Shared implementation behind _dbus_string_append() and
 * _dbus_string_append_len(): lengthens the string by buffer_len using
 * _dbus_string_lengthen() (which refuses to grow past max_length), then
 * copies into the newly added region at the end of the string.
 * The remaining parameters and the memcpy source/size arguments are not
 * present in this listing; presumably they are the caller's buffer and
 * buffer_len.
 *
 * @param real the string to append to
 */
829 append (DBusRealString *real,
836 if (!_dbus_string_lengthen ((DBusString*)real, buffer_len))
/* real->len now includes buffer_len, so the new region starts at real->len - buffer_len */
839 memcpy (real->str + (real->len - buffer_len),
847 * Appends a nul-terminated C-style string to a DBusString.
849 * @param str the DBusString
850 * @param buffer the nul-terminated characters to append
851 * @returns #FALSE if not enough memory.
854 _dbus_string_append (DBusString *str,
857 unsigned long buffer_len;
859 DBUS_STRING_PREAMBLE (str);
860 _dbus_assert (buffer != NULL);
862 buffer_len = strlen (buffer);
863 if (buffer_len > (unsigned long) real->max_length)
866 return append (real, buffer, buffer_len);
870 * Appends block of bytes with the given length to a DBusString.
872 * @param str the DBusString
873 * @param buffer the bytes to append
874 * @param len the number of bytes to append
875 * @returns #FALSE if not enough memory.
878 _dbus_string_append_len (DBusString *str,
882 DBUS_STRING_PREAMBLE (str);
883 _dbus_assert (buffer != NULL);
884 _dbus_assert (len >= 0);
886 return append (real, buffer, len);
890 * Appends a single byte to the string, returning #FALSE
891 * if not enough memory.
893 * @param str the string
894 * @param byte the byte to append
895 * @returns #TRUE on success
898 _dbus_string_append_byte (DBusString *str,
901 DBUS_STRING_PREAMBLE (str);
903 if (!set_length (real, real->len + 1))
906 real->str[real->len-1] = byte;
912 * Appends a single Unicode character, encoding the character in UTF-8 format.
915 * @param str the string
916 * @param ch the Unicode character
919 _dbus_string_append_unichar (DBusString *str,
927 DBUS_STRING_PREAMBLE (str);
929 /* this code is from GLib but is pretty standard I think */
943 else if (ch < 0x10000)
948 else if (ch < 0x200000)
953 else if (ch < 0x4000000)
964 if (len > (real->max_length - real->len))
965 return FALSE; /* real->len + len would overflow */
967 if (!set_length (real, real->len + len))
970 out = real->str + (real->len - len);
972 for (i = len - 1; i > 0; --i)
974 out[i] = (ch & 0x3f) | 0x80;
/* Removes a segment of len bytes beginning at start by sliding the bytes
 * that follow the segment down over it, then re-terminating the string.
 * Performs no argument checking itself; the public wrapper
 * _dbus_string_delete() asserts the range before calling this.
 *
 * NOTE(review): the statement that reduces real->len by len is not present
 * in this listing; the nul write below only lands at the new end of the
 * string if real->len has been updated in between.
 *
 * @param real the string to delete from
 */
983 delete (DBusRealString *real,
/* real->len - (start + len) is the number of bytes after the deleted segment */
990 memmove (real->str + start, real->str + start + len, real->len - (start + len));
992 real->str[real->len] = '\0';
996 * Deletes a segment of a DBusString with length len starting at
997 * start. (Hint: to clear an entire string, setting length to 0
998 * with _dbus_string_set_length() is easier.)
1000 * @param str the DBusString
1001 * @param start where to start deleting
1002 * @param len the number of bytes to delete
1005 _dbus_string_delete (DBusString *str,
1009 DBUS_STRING_PREAMBLE (str);
1010 _dbus_assert (start >= 0);
1011 _dbus_assert (len >= 0);
1012 _dbus_assert (start <= real->len);
1013 _dbus_assert (len <= real->len - start);
1015 delete (real, start, len);
/* Shared implementation behind the copy/move/replace functions: opens a
 * hole of len bytes in dest at insert_at with open_gap(), then copies
 * bytes from source, beginning at offset start, into that hole.
 * Fails (without copying) when open_gap() cannot grow dest.
 * The source string is not modified by the visible code.
 *
 * @param source the string to copy from
 * @param dest the string to copy into
 */
1019 copy (DBusRealString *source,
1022 DBusRealString *dest,
1028 if (!open_gap (len, dest, insert_at))
/* source and dest are different strings (asserted by DBUS_STRING_COPY_PREAMBLE in the callers), so memcpy rather than memmove is sufficient */
1031 memcpy (dest->str + insert_at,
1032 source->str + start,
1039 * Checks assertions for two strings we're copying a segment between,
1040 * and declares real_source/real_dest variables.
1042 * @param source the source string
1043 * @param start the starting offset
1044 * @param dest the dest string
1045 * @param insert_at where the copied segment is inserted
1047 #define DBUS_STRING_COPY_PREAMBLE(source, start, dest, insert_at) \
1048 DBusRealString *real_source = (DBusRealString*) source; \
1049 DBusRealString *real_dest = (DBusRealString*) dest; \
1050 _dbus_assert ((source) != (dest)); \
1051 DBUS_GENERIC_STRING_PREAMBLE (real_source); \
1052 DBUS_GENERIC_STRING_PREAMBLE (real_dest); \
1053 _dbus_assert (!real_dest->constant); \
1054 _dbus_assert (!real_dest->locked); \
1055 _dbus_assert ((start) >= 0); \
1056 _dbus_assert ((start) <= real_source->len); \
1057 _dbus_assert ((insert_at) >= 0); \
1058 _dbus_assert ((insert_at) <= real_dest->len)
1061 * Moves the end of one string into another string. Both strings
1062 * must be initialized, valid strings.
1064 * @param source the source string
1065 * @param start where to chop off the source string
1066 * @param dest the destination string
1067 * @param insert_at where to move the chopped-off part of source string
1068 * @returns #FALSE if not enough memory
1071 _dbus_string_move (DBusString *source,
1076 DBUS_STRING_COPY_PREAMBLE (source, start, dest, insert_at);
1078 if (!copy (real_source, start,
1079 real_source->len - start,
1084 delete (real_source, start,
1085 real_source->len - start);
1091 * Like _dbus_string_move(), but does not delete the section
1092 * of the source string that's copied to the dest string.
1094 * @param source the source string
1095 * @param start where to start copying the source string
1096 * @param dest the destination string
1097 * @param insert_at where to place the copied part of source string
1098 * @returns #FALSE if not enough memory
1101 _dbus_string_copy (const DBusString *source,
1106 DBUS_STRING_COPY_PREAMBLE (source, start, dest, insert_at);
1108 return copy (real_source, start,
1109 real_source->len - start,
1115 * Like _dbus_string_move(), but can move a segment from
1116 * the middle of the source string.
1118 * @param source the source string
1119 * @param start first byte of source string to move
1120 * @param len length of segment to move
1121 * @param dest the destination string
1122 * @param insert_at where to move the bytes from the source string
1123 * @returns #FALSE if not enough memory
1126 _dbus_string_move_len (DBusString *source,
1133 DBUS_STRING_COPY_PREAMBLE (source, start, dest, insert_at);
1134 _dbus_assert (len >= 0);
/* Range check written as a subtraction so it cannot overflow: start + len
 * may exceed INT_MAX for a bogus huge len and wrap, letting the bad length
 * through. start <= real_source->len is already asserted by the preamble,
 * so the subtraction is safe. Same form as _dbus_string_copy_len().
 */
1135 _dbus_assert (len <= real_source->len - start);
/* copy the segment into dest first; source is only modified once the copy has succeeded */
1137 if (!copy (real_source, start, len,
1142 delete (real_source, start,
1149 * Like _dbus_string_copy(), but can copy a segment from the middle of
1150 * the source string.
1152 * @param source the source string
1153 * @param start where to start copying the source string
1154 * @param len length of segment to copy
1155 * @param dest the destination string
1156 * @param insert_at where to place the copied segment of source string
1157 * @returns #FALSE if not enough memory
1160 _dbus_string_copy_len (const DBusString *source,
1166 DBUS_STRING_COPY_PREAMBLE (source, start, dest, insert_at);
1167 _dbus_assert (len >= 0);
1168 _dbus_assert (start <= real_source->len);
1169 _dbus_assert (len <= real_source->len - start);
1171 return copy (real_source, start, len,
1177 * Replaces a segment of dest string with a segment of source string.
1179 * @todo optimize the case where the two lengths are the same, and
1180 * avoid memmoving the data in the trailing part of the string twice.
1182 * @todo avoid inserting the source into dest, then deleting
1183 * the replaced chunk of dest (which creates a potentially large
1184 * intermediate string). Instead, extend the replaced chunk
1185 * of dest with padding to the same size as the source chunk,
1186 * then copy in the source bytes.
1188 * @param source the source string
1189 * @param start where to start copying the source string
1190 * @param len length of segment to copy
1191 * @param dest the destination string
1192 * @param replace_at start of segment of dest string to replace
1193 * @param replace_len length of segment of dest string to replace
1194 * @returns #FALSE if not enough memory
1198 _dbus_string_replace_len (const DBusString *source,
1205 DBUS_STRING_COPY_PREAMBLE (source, start, dest, replace_at);
1206 _dbus_assert (len >= 0);
1207 _dbus_assert (start <= real_source->len);
1208 _dbus_assert (len <= real_source->len - start);
1209 _dbus_assert (replace_at >= 0);
1210 _dbus_assert (replace_at <= real_dest->len);
1211 _dbus_assert (replace_len <= real_dest->len - replace_at);
1213 if (!copy (real_source, start, len,
1214 real_dest, replace_at))
1217 delete (real_dest, replace_at + len, replace_len);
1222 /* Unicode macros and utf8_validate() from GLib Owen Taylor, Havoc
1223 * Pennington, and Tom Tromey are the authors and authorized relicense.
1226 /** computes length and mask of a unicode character
1227 * @param Char the char
1228 * @param Mask the mask variable to assign to
1229 * @param Len the length variable to assign to
1231 #define UTF8_COMPUTE(Char, Mask, Len) \
1237 else if ((Char & 0xe0) == 0xc0) \
1242 else if ((Char & 0xf0) == 0xe0) \
1247 else if ((Char & 0xf8) == 0xf0) \
1252 else if ((Char & 0xfc) == 0xf8) \
1257 else if ((Char & 0xfe) == 0xfc) \
1266 * computes length of a unicode character in UTF-8
1267 * @param Char the char
1269 #define UTF8_LENGTH(Char) \
1270 ((Char) < 0x80 ? 1 : \
1271 ((Char) < 0x800 ? 2 : \
1272 ((Char) < 0x10000 ? 3 : \
1273 ((Char) < 0x200000 ? 4 : \
1274 ((Char) < 0x4000000 ? 5 : 6)))))
1277 * Gets a UTF-8 value.
1279 * @param Result variable for extracted unicode char.
1280 * @param Chars the bytes to decode
1281 * @param Count counter variable
1282 * @param Mask mask for this char
1283 * @param Len length for this char in bytes
1285 #define UTF8_GET(Result, Chars, Count, Mask, Len) \
1286 (Result) = (Chars)[0] & (Mask); \
1287 for ((Count) = 1; (Count) < (Len); ++(Count)) \
1289 if (((Chars)[(Count)] & 0xc0) != 0x80) \
1295 (Result) |= ((Chars)[(Count)] & 0x3f); \
1299 * Check whether a unicode char is in a valid range.
1301 * @param Char the character
1303 #define UNICODE_VALID(Char) \
1304 ((Char) < 0x110000 && \
1305 (((Char) & 0xFFFFF800) != 0xD800) && \
1306 ((Char) < 0xFDD0 || (Char) > 0xFDEF) && \
1307 ((Char) & 0xFFFF) != 0xFFFF)
1310 * Gets a unicode character from a UTF-8 string. Does no validation;
1311 * you must verify that the string is valid UTF-8 in advance and must
1312 * pass in the start of a character.
1314 * @param str the string
1315 * @param start the start of the UTF-8 character.
1316 * @param ch_return location to return the character
1317 * @param end_return location to return the byte index of next character
1320 _dbus_string_get_unichar (const DBusString *str,
1322 dbus_unichar_t *ch_return,
1326 dbus_unichar_t result;
1329 DBUS_CONST_STRING_PREAMBLE (str);
1330 _dbus_assert (start >= 0);
1331 _dbus_assert (start <= real->len);
1336 *end_return = real->len;
1339 p = real->str + start;
1342 UTF8_COMPUTE (c, mask, len);
1345 UTF8_GET (result, p, i, mask, len);
1347 if (result == (dbus_unichar_t)-1)
1351 *ch_return = result;
1353 *end_return = start + len;
1357 * Finds the given substring in the string,
1358 * returning #TRUE and filling in the byte index
1359 * where the substring was found, if it was found.
1360 * Returns #FALSE if the substring wasn't found.
1361 * Sets *found to the length of the string if the substring is not found.
1364 * @param str the string
1365 * @param start where to start looking
1366 * @param substr the substring
1367 * @param found return location for where it was found, or #NULL
1368 * @returns #TRUE if found
1371 _dbus_string_find (const DBusString *str,
1376 return _dbus_string_find_to (str, start,
1377 ((const DBusRealString*)str)->len,
1382 * Finds the given substring in the string,
1383 * up to a certain position,
1384 * returning #TRUE and filling in the byte index
1385 * where the substring was found, if it was found.
1386 * Returns #FALSE if the substring wasn't found.
1387 * Sets *found to the length of the string if the substring is not found.
1390 * @param str the string
1391 * @param start where to start looking
1392 * @param end where to stop looking
1393 * @param substr the substring
1394 * @param found return location for where it was found, or #NULL
1395 * @returns #TRUE if found
1398 _dbus_string_find_to (const DBusString *str,
1405 DBUS_CONST_STRING_PREAMBLE (str);
1406 _dbus_assert (substr != NULL);
1407 _dbus_assert (start <= real->len);
1408 _dbus_assert (start >= 0);
1409 _dbus_assert (substr != NULL);
1410 _dbus_assert (end <= real->len);
1411 _dbus_assert (start <= end);
1413 /* we always "find" an empty string */
1414 if (*substr == '\0')
1424 if (real->str[i] == substr[0])
1430 if (substr[j - i] == '\0')
1432 else if (real->str[j] != substr[j - i])
1438 if (substr[j - i] == '\0')
1456 * Finds a blank (space or tab) in the string. Returns #TRUE
1457 * if found, #FALSE otherwise. If a blank is not found sets
1458 * *found to the length of the string.
1460 * @param str the string
1461 * @param start byte index to start looking
1462 * @param found place to store the location of the first blank
1463 * @returns #TRUE if a blank was found
// Scans forward from byte index start looking for the first space or tab.
// NOTE(review): the lines that store the result in *found and return are missing from this listing.
1466 _dbus_string_find_blank (const DBusString *str,
1471 DBUS_CONST_STRING_PREAMBLE (str);
1472 _dbus_assert (start <= real->len);
1473 _dbus_assert (start >= 0);
1476 while (i < real->len)
// A blank is exactly ' ' or '\t'; newline and carriage return are not tested here.
1478 if (real->str[i] == ' ' ||
1479 real->str[i] == '\t')
1496 * Skips blanks from start, storing the first non-blank in *end
1497 * (blank is space or tab).
1499 * @param str the string
1500 * @param start where to start
1501 * @param end where to store the first non-blank byte index
// Advances from byte index start past consecutive space and tab bytes.
// NOTE(review): the store into *end is on a line missing from this listing.
1504 _dbus_string_skip_blank (const DBusString *str,
1509 DBUS_CONST_STRING_PREAMBLE (str);
1510 _dbus_assert (start <= real->len);
1511 _dbus_assert (start >= 0);
1514 while (i < real->len)
// The scan is interested in the first byte that is neither space nor tab.
1516 if (!(real->str[i] == ' ' ||
1517 real->str[i] == '\t'))
// Postcondition: i is either the string length or the index of a non-blank byte.
1523 _dbus_assert (i == real->len || !(real->str[i] == ' ' ||
1524 real->str[i] == '\t'));
1531 * Skips whitespace from start, storing the first non-whitespace in *end.
1532 * (whitespace is space, tab, newline, CR).
1534 * @param str the string
1535 * @param start where to start
1536 * @param end where to store the first non-whitespace byte index
// Advances from byte index start past consecutive whitespace bytes (space, newline, carriage return, tab).
// NOTE(review): the store into *end is on a line missing from this listing.
1539 _dbus_string_skip_white (const DBusString *str,
1544 DBUS_CONST_STRING_PREAMBLE (str);
1545 _dbus_assert (start <= real->len);
1546 _dbus_assert (start >= 0);
1549 while (i < real->len)
// The scan is interested in the first byte that is none of the four whitespace characters.
1551 if (!(real->str[i] == ' ' ||
1552 real->str[i] == '\n' ||
1553 real->str[i] == '\r' ||
1554 real->str[i] == '\t'))
// NOTE(review): this postcondition only rules out space and tab, while the loop above also treats newline and carriage return as whitespace; the assertion is weaker than the loop and could be tightened.
1560 _dbus_assert (i == real->len || !(real->str[i] == ' ' ||
1561 real->str[i] == '\t'));
1568 * Assigns a newline-terminated or \r\n-terminated line from the front
1569 * of the string to the given dest string. The dest string's previous
1570 * contents are deleted. If the source string contains no newline,
1571 * moves the entire source string to the dest string.
1573 * @todo owen correctly notes that this is a stupid function (it was
1574 * written purely for test code,
1575 * e.g. dbus-message-builder.c). Probably should be enforced as test
1576 * code only with #ifdef DBUS_BUILD_TESTS
1578 * @param source the source string
1579 * @param dest the destination string (contents are replaced)
1580 * @returns #FALSE if no memory, or source has length 0
// Moves the first line of source into dest and then strips the line terminator from dest.
// NOTE(review): several short lines (braces, else, some returns) are missing from this listing; the notes cover only what is visible.
1583 _dbus_string_pop_line (DBusString *source,
1587 dbus_bool_t have_newline;
// Whatever dest held before is discarded.
1589 _dbus_string_set_length (dest, 0);
1592 if (_dbus_string_find (source, 0, "\n", &eol))
1594 have_newline = TRUE;
1595 eol += 1; /* include newline */
// Without a newline the whole remaining source is taken as the line.
1599 eol = _dbus_string_get_length (source);
1600 have_newline = FALSE;
1604 return FALSE; /* eof */
1606 if (!_dbus_string_move_len (source, 0, eol,
1612 /* dump the newline and the \r if we have one */
1615 dbus_bool_t have_cr;
1617 _dbus_assert (_dbus_string_get_length (dest) > 0);
// The byte just before the final one decides whether the line ended in CR LF; the length guard keeps the index non-negative.
1619 if (_dbus_string_get_length (dest) > 1 &&
1620 _dbus_string_get_byte (dest,
1621 _dbus_string_get_length (dest) - 2) == '\r')
// NOTE(review): the amount subtracted from the length is on a line missing from this listing.
1626 _dbus_string_set_length (dest,
1627 _dbus_string_get_length (dest) -
1635 * Deletes up to and including the first blank space
1638 * @param str the string
// Deletes bytes [0, i) from the front of the string, where i is computed by the two calls below.
1641 _dbus_string_delete_first_word (DBusString *str)
// When a blank exists, i is moved past the whole run of blanks that follows the first word; otherwise i keeps whatever _dbus_string_find_blank stored (documented as the string length).
1645 if (_dbus_string_find_blank (str, 0, &i))
1646 _dbus_string_skip_blank (str, i, &i);
1648 _dbus_string_delete (str, 0, i);
1652 * Deletes any leading blanks in the string
1654 * @param str the string
// Removes the run of spaces and tabs at the front of the string.
1657 _dbus_string_delete_leading_blanks (DBusString *str)
// i receives the index of the first non-blank byte.
1661 _dbus_string_skip_blank (str, 0, &i);
// NOTE(review): a guard may sit on the line missing between these two statements - confirm.
1664 _dbus_string_delete (str, 0, i);
1668 * Tests two DBusString for equality.
1670 * @todo memcmp is probably faster
1672 * @param a first string
1673 * @param b second string
1674 * @returns #TRUE if equal
// Compares two strings for equality.
// NOTE(review): the comparison loop and the return statements are on lines missing from this listing.
1677 _dbus_string_equal (const DBusString *a,
1678 const DBusString *b)
1680 const unsigned char *ap;
1681 const unsigned char *bp;
1682 const unsigned char *a_end;
1683 const DBusRealString *real_a = (const DBusRealString*) a;
1684 const DBusRealString *real_b = (const DBusRealString*) b;
1685 DBUS_GENERIC_STRING_PREAMBLE (real_a);
1686 DBUS_GENERIC_STRING_PREAMBLE (real_b);
// The lengths are compared before any byte is looked at.
1688 if (real_a->len != real_b->len)
// One past the last byte of a; presumably only a needs an end pointer because the lengths are known to match here - confirm.
1693 a_end = real_a->str + real_a->len;
1707 * Tests two DBusString for equality up to the given length.
1709 * @todo write a unit test
1711 * @todo memcmp is probably faster
1713 * @param a first string
1714 * @param b second string
1715 * @param len the length
1716 * @returns #TRUE if equal for the given number of bytes
// Compares the leading bytes of two strings, looking at no more than len bytes.
// NOTE(review): the comparison loop and the return statements are on lines missing from this listing.
1719 _dbus_string_equal_len (const DBusString *a,
1720 const DBusString *b,
1723 const unsigned char *ap;
1724 const unsigned char *bp;
1725 const unsigned char *a_end;
1726 const DBusRealString *real_a = (const DBusRealString*) a;
1727 const DBusRealString *real_b = (const DBusRealString*) b;
1728 DBUS_GENERIC_STRING_PREAMBLE (real_a);
1729 DBUS_GENERIC_STRING_PREAMBLE (real_b);
// This test fires only when the lengths differ and at least one string is shorter than len.
1731 if (real_a->len != real_b->len &&
1732 (real_a->len < len || real_b->len < len))
// The comparison is bounded by len, or by the end of a when a is shorter than len.
1737 a_end = real_a->str + MIN (real_a->len, len);
1751 * Checks whether a string is equal to a C string.
1753 * @param a the string
1754 * @param c_str the C string
1755 * @returns #TRUE if equal
// Compares the string with a nul-terminated C string.
// NOTE(review): the loop body and the return statements are on lines missing from this listing.
1758 _dbus_string_equal_c_str (const DBusString *a,
1761 const unsigned char *ap;
1762 const unsigned char *bp;
1763 const unsigned char *a_end;
1764 const DBusRealString *real_a = (const DBusRealString*) a;
1765 DBUS_GENERIC_STRING_PREAMBLE (real_a);
1766 _dbus_assert (c_str != NULL);
1769 bp = (const unsigned char*) c_str;
1770 a_end = real_a->str + real_a->len;
// Walk both inputs until the string is exhausted or the terminator of c_str is reached.
1771 while (ap != a_end && *bp)
// Anything left over on either side means the two inputs differ in length.
1780 if (ap != a_end || *bp)
1787 * Checks whether a string starts with the given C string.
1789 * @param a the string
1790 * @param c_str the C string
1791 * @returns #TRUE if string starts with it
// Tests whether the string begins with the nul-terminated C string c_str.
// NOTE(review): the loop body and the return statements are on lines missing from this listing.
1794 _dbus_string_starts_with_c_str (const DBusString *a,
1797 const unsigned char *ap;
1798 const unsigned char *bp;
1799 const unsigned char *a_end;
1800 const DBusRealString *real_a = (const DBusRealString*) a;
1801 DBUS_GENERIC_STRING_PREAMBLE (real_a);
1802 _dbus_assert (c_str != NULL);
1805 bp = (const unsigned char*) c_str;
1806 a_end = real_a->str + real_a->len;
// The walk ends when either the string or the prefix runs out.
1807 while (ap != a_end && *bp)
1823 * Returns whether a string ends with the given suffix
1825 * @todo memcmp might make this faster.
1827 * @param a the string
1828 * @param c_str the C-style string
1829 * @returns #TRUE if the string ends with the suffix
// Tests whether the string ends with the nul-terminated C string c_str.
// NOTE(review): the comparison loop and the return statements are on lines missing from this listing.
1832 _dbus_string_ends_with_c_str (const DBusString *a,
1835 const unsigned char *ap;
1836 const unsigned char *bp;
1837 const unsigned char *a_end;
1838 unsigned long c_str_len;
1839 const DBusRealString *real_a = (const DBusRealString*) a;
1840 DBUS_GENERIC_STRING_PREAMBLE (real_a);
1841 _dbus_assert (c_str != NULL);
1843 c_str_len = strlen (c_str);
// This test fires when the suffix is longer than the string itself.
1844 if (((unsigned long)real_a->len) < c_str_len)
// The comparison starts c_str_len bytes before the end of the string.
1847 ap = real_a->str + (real_a->len - c_str_len);
1848 bp = (const unsigned char*) c_str;
1849 a_end = real_a->str + real_a->len;
// Both cursors are expected to rest on a nul byte afterwards; for ap that presumably is the byte at a_end, which assumes the buffer keeps a nul after its contents - confirm.
1859 _dbus_assert (*ap == '\0');
1860 _dbus_assert (*bp == '\0');
// Lookup table read through ENCODE_64 in _dbus_string_base64_encode; its entries are missing from this listing.
1865 static const signed char base64_table[] = {
// 43 is '+' and 122 is 'z' in ASCII.
1932 /** The minimum char that's a valid char in Base64-encoded text */
1933 #define UNBASE64_MIN_CHAR (43)
1934 /** The maximum char that's a valid char in Base64-encoded text */
1935 #define UNBASE64_MAX_CHAR (122)
1936 /** Must subtract this from a char's integer value before offsetting
1937 * into unbase64_table
1939 #define UNBASE64_TABLE_OFFSET UNBASE64_MIN_CHAR
// Reverse table; _dbus_string_base64_decode indexes it with (character - UNBASE64_TABLE_OFFSET). Its entries are missing from this listing.
1940 static const signed char unbase64_table[] = {
2024 * Encodes a string using Base64, as documented in RFC 2045.
2026 * @param source the string to encode
2027 * @param start byte index to start encoding
2028 * @param dest string where encoded data should be placed
2029 * @param insert_at where to place encoded data
2030 * @returns #TRUE if encoding was successful, #FALSE if no memory etc.
// Encodes the bytes of source from index start onward and writes the text into dest at insert_at.
// NOTE(review): this listing omits short lines (braces, case labels, returns, a few assignments); the notes cover only the visible statements.
2033 _dbus_string_base64_encode (const DBusString *source,
2039 unsigned int dest_len; /* unsigned for overflow checks below */
2040 const unsigned char *s;
2042 const unsigned char *triplet_end;
2043 const unsigned char *final_end;
2044 DBUS_STRING_COPY_PREAMBLE (source, start, dest, insert_at);
2045 _dbus_assert (source != dest);
2047 /* For each 24 bits (3 bytes) of input, we have 4 bytes of
2050 source_len = real_source->len - start;
// Four output bytes per complete input triplet; the adjustment for a partial trailing group is on a missing line.
2051 dest_len = (source_len / 3) * 4;
2052 if (source_len % 3 != 0)
2055 if (dest_len > (unsigned int) real_dest->max_length)
2058 if (source_len == 0)
// Room for the whole output is opened in dest up front, so the loops below write straight through d.
2061 if (!open_gap (dest_len, real_dest, insert_at))
2064 d = real_dest->str + insert_at;
2065 s = real_source->str + start;
2066 final_end = real_source->str + (start + source_len);
// triplet_end marks where the complete 3-byte groups stop; 0, 1 or 2 bytes remain between it and final_end.
2067 triplet_end = final_end - (source_len % 3);
2068 _dbus_assert (triplet_end <= final_end);
2069 _dbus_assert ((final_end - triplet_end) < 3);
2071 #define ENCODE_64(v) (base64_table[ (unsigned char) (v) ])
2072 #define SIX_BITS_MASK (0x3f)
2073 _dbus_assert (SIX_BITS_MASK < _DBUS_N_ELEMENTS (base64_table));
2075 while (s != triplet_end)
2077 unsigned int triplet;
// Pack three bytes big-endian into 24 bits, then emit four 6-bit groups from the top down.
2079 triplet = s[2] | (s[1] << 8) | (s[0] << 16);
2081 /* Encode each 6 bits. */
2083 *d++ = ENCODE_64 (triplet >> 18);
2084 *d++ = ENCODE_64 ((triplet >> 12) & SIX_BITS_MASK);
2085 *d++ = ENCODE_64 ((triplet >> 6) & SIX_BITS_MASK);
2086 *d++ = ENCODE_64 (triplet & SIX_BITS_MASK);
// The leftover byte count selects how the tail is written.
2091 switch (final_end - triplet_end)
2095 unsigned int doublet;
// NOTE(review): the 16 leftover bits are emitted right-aligned (shifts of 12, 6, 0). RFC 2045 pads with zero bits on the right instead, so this tail looks like it differs from standard Base64 output - confirm before relying on interoperability.
2097 doublet = s[1] | (s[0] << 8);
2099 *d++ = ENCODE_64 (doublet >> 12);
2100 *d++ = ENCODE_64 ((doublet >> 6) & SIX_BITS_MASK);
2101 *d++ = ENCODE_64 (doublet & SIX_BITS_MASK);
2107 unsigned int singlet;
// NOTE(review): same right-aligned packing for a single leftover byte (shifts of 6, 0).
2111 *d++ = ENCODE_64 ((singlet >> 6) & SIX_BITS_MASK);
2112 *d++ = ENCODE_64 (singlet & SIX_BITS_MASK);
// The write cursor must land exactly at the end of the gap opened above.
2121 _dbus_assert (d == (real_dest->str + (insert_at + dest_len)));
2127 * Decodes a string from Base64, as documented in RFC 2045.
2129 * @todo sort out the AUDIT comment in here. The case it mentions
2130 * ("====" or "x===") is not allowed in correct base64, so need to
2131 * decide what to do with that kind of input. Probably ignore it
2132 * since we ignore any other junk seen.
2134 * @param source the string to decode
2135 * @param start byte index to start decode
2136 * @param dest string where decoded data should be placed
2137 * @param insert_at where to place decoded data
2138 * @returns #TRUE if decoding was successful, #FALSE if no memory etc.
2141 _dbus_string_base64_decode (const DBusString *source,
2150 unsigned int triplet = 0;
2153 DBUS_STRING_COPY_PREAMBLE (source, start, dest, insert_at);
2154 _dbus_assert (source != dest);
2156 source_len = real_source->len - start;
2157 s = real_source->str + start;
2158 end = real_source->str + source_len;
2160 if (source_len == 0)
2163 if (!_dbus_string_init (&result, _DBUS_INT_MAX))
2170 /* The idea is to just skip anything that isn't
2171 * a base64 char - it's allowed to have whitespace,
2172 * newlines, etc. in here. We also ignore trailing
2173 * base64 chars, though that's suspicious.
2176 if (*s >= UNBASE64_MIN_CHAR &&
2177 *s <= UNBASE64_MAX_CHAR)
2181 /* '=' is padding, doesn't represent additional data
2182 * but does increment our count.
2191 val = unbase64_table[(*s) - UNBASE64_TABLE_OFFSET];
2196 triplet |= (unsigned int) val;
2201 if (sextet_count == 4)
2203 /* no pad = 3 bytes, 1 pad = 2 bytes, 2 pad = 1 byte */
2206 /* AUDIT: Comment doesn't mention 4 pad => 0,
2207 * 3 pad => 1 byte, though the code should
2208 * work fine if those are the required outputs.
2210 * I assume that the spec requires dropping
2211 * the top two bits of, say, ///= which is > 2
2212 * bytes worth of bits. (Or otherwise, you couldn't
2213 * actually represent 2 byte sequences.
2218 if (!_dbus_string_append_byte (&result,
2225 if (!_dbus_string_append_byte (&result,
2226 (triplet >> 8) & 0xff))
2230 if (!_dbus_string_append_byte (&result,
2243 if (!_dbus_string_move (&result, 0, dest, insert_at))
2245 _dbus_string_free (&result);
2249 _dbus_string_free (&result);
2254 _dbus_string_free (&result);
2260 * Encodes a string in hex, the way MD5 and SHA-1 are usually
2261 * encoded. (Each byte is two hex digits.)
2263 * @param source the string to encode
2264 * @param start byte index to start encoding
2265 * @param dest string where encoded data should be placed
2266 * @param insert_at where to place encoded data
2267 * @returns #TRUE if encoding was successful, #FALSE if no memory etc.
// Writes two lowercase hex digits per source byte into a temporary string, then moves that string into dest at insert_at.
// NOTE(review): the loop header, the pointer advance past start and the returns are on lines missing from this listing.
2270 _dbus_string_hex_encode (const DBusString *source,
2276 const char hexdigits[16] = {
2277 '0', '1', '2', '3', '4', '5', '6', '7', '8', '9',
2278 'a', 'b', 'c', 'd', 'e', 'f'
2280 const unsigned char *p;
2281 const unsigned char *end;
2284 _dbus_assert (start <= _dbus_string_get_length (source));
2286 if (!_dbus_string_init (&result, _DBUS_INT_MAX))
2291 _dbus_string_get_const_data (source, (const char**) &p);
// end is one past the last byte of source, measured from the start of the data.
2292 end = p + _dbus_string_get_length (source);
// High nibble first, then low nibble.
2297 if (!_dbus_string_append_byte (&result,
2298 hexdigits[(*p >> 4)]))
2301 if (!_dbus_string_append_byte (&result,
2302 hexdigits[(*p & 0x0f)]))
2308 if (!_dbus_string_move (&result, 0, dest, insert_at))
2314 _dbus_string_free (&result);
2319 * Decodes a string from hex encoding.
2321 * @param source the string to decode
2322 * @param start byte index to start decode
2323 * @param dest string where decoded data should be placed
2324 * @param insert_at where to place decoded data
2325 * @returns #TRUE if decoding was successful, #FALSE if no memory etc.
// Decodes hex text from source into a temporary string, then moves that string into dest at insert_at.
// NOTE(review): the per-character digit mapping, the loop header and the returns are on lines missing from this listing.
2328 _dbus_string_hex_decode (const DBusString *source,
2334 const unsigned char *p;
2335 const unsigned char *end;
// high_bits is flipped once per processed character (see the toggle below); presumably it tracks which half of the output byte comes next - confirm.
2337 dbus_bool_t high_bits;
2339 _dbus_assert (start <= _dbus_string_get_length (source));
2341 if (!_dbus_string_init (&result, _DBUS_INT_MAX))
2347 _dbus_string_get_const_data (source, (const char**) &p);
2348 end = p + _dbus_string_get_length (source);
2413 _dbus_verbose ("invalid character '%c' in hex encoded text\n",
2420 if (!_dbus_string_append_byte (&result,
// The most recently appended byte is read back, changed on a missing line, and stored again.
2429 len = _dbus_string_get_length (&result);
2431 b = _dbus_string_get_byte (&result, len - 1);
2435 _dbus_string_set_byte (&result, len - 1, b);
2438 high_bits = !high_bits;
2443 if (!_dbus_string_move (&result, 0, dest, insert_at))
2449 _dbus_string_free (&result);
2454 * Checks that the given range of the string is valid ASCII with no
2455 * nul bytes. If the given range is not entirely contained in the
2456 * string, returns #FALSE.
2458 * @todo this is inconsistent with most of DBusString in that
2459 * it allows a start,len range that isn't in the string.
2461 * @param str the string
2462 * @param start first byte index to check
2463 * @param len number of bytes to check
2464 * @returns #TRUE if the byte range exists and is all valid ASCII
// Checks the byte range [start, start + len) of the string.
// NOTE(review): the loop header, the first half of the per-byte condition and the returns are on lines missing from this listing.
2467 _dbus_string_validate_ascii (const DBusString *str,
2471 const unsigned char *s;
2472 const unsigned char *end;
2473 DBUS_CONST_STRING_PREAMBLE (str);
2474 _dbus_assert (start >= 0);
2475 _dbus_assert (start <= real->len);
2476 _dbus_assert (len >= 0);
// Range check written as a subtraction so that start + len is never computed.
2478 if (len > real->len - start)
2481 s = real->str + start;
// Any bit outside the low seven marks a byte that is not ASCII.
2486 ((*s & ~0x7f) != 0))
2496 * Checks that the given range of the string is valid UTF-8. If the
2497 * given range is not entirely contained in the string, returns
2498 * #FALSE. If the string contains any nul bytes in the given range,
2499 * returns #FALSE. If the start and start+len are not on character
2500 * boundaries, returns #FALSE.
2502 * @todo this is inconsistent with most of DBusString in that
2503 * it allows a start,len range that isn't in the string.
2505 * @param str the string
2506 * @param start first byte index to check
2507 * @param len number of bytes to check
2508 * @returns #TRUE if the byte range exists and is all valid UTF-8
// Walks the byte range [start, start + len) one UTF-8 sequence at a time.
// NOTE(review): the loop header, the pointer advance and the returns are on lines missing from this listing.
2511 _dbus_string_validate_utf8 (const DBusString *str,
2515 const unsigned char *p;
2516 const unsigned char *end;
2517 DBUS_CONST_STRING_PREAMBLE (str);
2518 _dbus_assert (start >= 0);
2519 _dbus_assert (start <= real->len);
2520 _dbus_assert (len >= 0);
// Range check written as a subtraction so that start + len is never computed.
2522 if (len > real->len - start)
2525 p = real->str + start;
2530 int i, mask = 0, char_len;
2531 dbus_unichar_t result;
2532 unsigned char c = (unsigned char) *p;
// char_len is treated below as the byte length of the sequence; presumably UTF8_COMPUTE derives it from the lead byte - confirm against the macro.
2534 UTF8_COMPUTE (c, mask, char_len);
2539 /* check that the expected number of bytes exists in the remaining length */
2540 if ((end - p) < char_len)
2543 UTF8_GET (result, p, i, mask, char_len);
2545 if (UTF8_LENGTH (result) != char_len) /* Check for overlong UTF-8 */
// Same sentinel comparison that _dbus_string_get_unichar performs after UTF8_GET.
2548 if (result == (dbus_unichar_t)-1)
2551 if (!UNICODE_VALID (result))
2557 /* See that we covered the entire length if a length was
2567 * Checks that the given range of the string is all nul bytes. If the
2568 * given range is not entirely contained in the string, returns #FALSE.
2571 * @todo this is inconsistent with most of DBusString in that
2572 * it allows a start,len range that isn't in the string.
2574 * @param str the string
2575 * @param start first byte index to check
2576 * @param len number of bytes to check
2577 * @returns #TRUE if the byte range exists and is all nul bytes
// Checks the byte range [start, start + len) of the string.
// NOTE(review): the per-byte loop and the returns are on lines missing from this listing.
2580 _dbus_string_validate_nul (const DBusString *str,
2584 const unsigned char *s;
2585 const unsigned char *end;
2586 DBUS_CONST_STRING_PREAMBLE (str);
2587 _dbus_assert (start >= 0);
2588 _dbus_assert (len >= 0);
2589 _dbus_assert (start <= real->len);
// Range check written as a subtraction so that start + len is never computed.
2591 if (len > real->len - start)
2594 s = real->str + start;
2607 * Clears all allocated bytes in the string to zero.
2609 * @param str the string
// Overwrites the string's buffer with zero bytes.
2612 _dbus_string_zero (DBusString *str)
2614 DBUS_STRING_PREAMBLE (str);
// The fill covers real->allocated bytes, i.e. the whole allocation and not just the first real->len bytes.
2616 memset (real->str, '\0', real->allocated);
2620 #ifdef DBUS_BUILD_TESTS
2621 #include "dbus-test.h"
// Checks that set_length accepts max_len - 1, max_len and 0 but rejects max_len + 1.
// NOTE(review): a guard line is missing before the first check in this listing.
2625 test_max_len (DBusString *str,
2630 if (!_dbus_string_set_length (str, max_len - 1))
2631 _dbus_assert_not_reached ("setting len to one less than max should have worked");
2634 if (!_dbus_string_set_length (str, max_len))
2635 _dbus_assert_not_reached ("setting len to max len should have worked");
// Note the missing negation: here success is the failure case.
2637 if (_dbus_string_set_length (str, max_len + 1))
2638 _dbus_assert_not_reached ("setting len to one more than max len should not have worked");
2640 if (!_dbus_string_set_length (str, 0))
2641 _dbus_assert_not_reached ("setting len to zero should have worked");
// Encodes data as Base64, decodes the result, and aborts with a diagnostic dump if the decoded bytes differ from the input.
2645 test_base64_roundtrip (const unsigned char *data,
// NOTE(review): the condition guarding this strlen is on a missing line; callers pass -1 for nul-terminated input.
2653 len = strlen (data);
2655 if (!_dbus_string_init (&orig, _DBUS_INT_MAX))
2656 _dbus_assert_not_reached ("could not init string");
2658 if (!_dbus_string_init (&encoded, _DBUS_INT_MAX))
2659 _dbus_assert_not_reached ("could not init string");
2661 if (!_dbus_string_init (&decoded, _DBUS_INT_MAX))
2662 _dbus_assert_not_reached ("could not init string");
2664 if (!_dbus_string_append_len (&orig, data, len))
2665 _dbus_assert_not_reached ("couldn't append orig data");
2667 if (!_dbus_string_base64_encode (&orig, 0, &encoded, 0))
2668 _dbus_assert_not_reached ("could not encode");
2670 if (!_dbus_string_base64_decode (&encoded, 0, &decoded, 0))
2671 _dbus_assert_not_reached ("could not decode");
// On mismatch, print the three lengths and both payloads before aborting.
2673 if (!_dbus_string_equal (&orig, &decoded))
2677 printf ("Original string %d bytes encoded %d bytes decoded %d bytes\n",
2678 _dbus_string_get_length (&orig),
2679 _dbus_string_get_length (&encoded),
2680 _dbus_string_get_length (&decoded));
2681 printf ("Original: %s\n", data);
2682 _dbus_string_get_const_data (&decoded, &s);
2683 printf ("Decoded: %s\n", s);
2684 _dbus_assert_not_reached ("original string not the same as string decoded from base64");
2687 _dbus_string_free (&orig);
2688 _dbus_string_free (&encoded);
2689 _dbus_string_free (&decoded);
2693 test_hex_roundtrip (const unsigned char *data,
2701 len = strlen (data);
2703 if (!_dbus_string_init (&orig, _DBUS_INT_MAX))
2704 _dbus_assert_not_reached ("could not init string");
2706 if (!_dbus_string_init (&encoded, _DBUS_INT_MAX))
2707 _dbus_assert_not_reached ("could not init string");
2709 if (!_dbus_string_init (&decoded, _DBUS_INT_MAX))
2710 _dbus_assert_not_reached ("could not init string");
2712 if (!_dbus_string_append_len (&orig, data, len))
2713 _dbus_assert_not_reached ("couldn't append orig data");
2715 if (!_dbus_string_hex_encode (&orig, 0, &encoded, 0))
2716 _dbus_assert_not_reached ("could not encode");
2718 if (!_dbus_string_hex_decode (&encoded, 0, &decoded, 0))
2719 _dbus_assert_not_reached ("could not decode");
2721 if (!_dbus_string_equal (&orig, &decoded))
2725 printf ("Original string %d bytes encoded %d bytes decoded %d bytes\n",
2726 _dbus_string_get_length (&orig),
2727 _dbus_string_get_length (&encoded),
2728 _dbus_string_get_length (&decoded));
2729 printf ("Original: %s\n", data);
2730 _dbus_string_get_const_data (&decoded, &s);
2731 printf ("Decoded: %s\n", s);
2732 _dbus_assert_not_reached ("original string not the same as string decoded from base64");
2735 _dbus_string_free (&orig);
2736 _dbus_string_free (&encoded);
2737 _dbus_string_free (&decoded);
// Signature shared by test_base64_roundtrip and test_hex_roundtrip so that test_roundtrips can drive either one; the second parameter line is missing from this listing.
2740 typedef void (* TestRoundtripFunc) (const unsigned char *data,
// Runs the given roundtrip function over a fixed set of inputs.
// NOTE(review): some calls and the bodies of the two buffer loops are on lines missing from this listing.
2743 test_roundtrips (TestRoundtripFunc func)
// A length of -1 is passed for nul-terminated inputs; the tails of 0 to 5 extra characters give consecutive input lengths.
2745 (* func) ("Hello this is a string\n", -1);
2746 (* func) ("Hello this is a string\n1", -1);
2747 (* func) ("Hello this is a string\n12", -1);
2748 (* func) ("Hello this is a string\n123", -1);
2749 (* func) ("Hello this is a string\n1234", -1);
2750 (* func) ("Hello this is a string\n12345", -1);
// Explicit lengths equal to the number of characters.
2754 (* func) ("123", 3);
2755 (* func) ("1234", 4);
2756 (* func) ("12345", 5);
// One byte longer than the characters, so the terminating nul of the literal is part of the payload.
2760 (* func) ("123", 4);
2761 (* func) ("1234", 5);
2762 (* func) ("12345", 6);
2764 unsigned char buf[512];
2768 while (i < _DBUS_N_ELEMENTS (buf))
2774 while (i < _DBUS_N_ELEMENTS (buf))
2784 * @ingroup DBusStringInternals
2785 * Unit test for DBusString.
2787 * @todo Need to write tests for _dbus_string_copy() and
2788 * _dbus_string_move() moving to/from each of start/middle/end of a
2789 * string. Also need tests for _dbus_string_move_len ()
2791 * @returns #TRUE on success.
// Unit test entry point for DBusString; each section below sets up its own strings and frees them again.
// NOTE(review): this listing omits short lines (declarations, loop counters, braces, the final return).
2794 _dbus_string_test (void)
2801 int lens[] = { 0, 1, 2, 3, 4, 5, 10, 16, 17, 18, 25, 31, 32, 33, 34, 35, 63, 64, 65, 66, 67, 68, 69, 70, 71, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136 };
// Maximum-length handling for every size in lens.
2806 while (i < _DBUS_N_ELEMENTS (lens))
2808 if (!_dbus_string_init (&str, lens[i]))
2809 _dbus_assert_not_reached ("failed to init string");
2811 test_max_len (&str, lens[i]);
2812 _dbus_string_free (&str);
2817 /* Test shortening and setting length */
2819 while (i < _DBUS_N_ELEMENTS (lens))
2823 if (!_dbus_string_init (&str, lens[i]))
2824 _dbus_assert_not_reached ("failed to init string");
2826 if (!_dbus_string_set_length (&str, lens[i]))
2827 _dbus_assert_not_reached ("failed to set string length");
2832 _dbus_assert (_dbus_string_get_length (&str) == j);
2835 _dbus_string_shorten (&str, 1);
2836 _dbus_assert (_dbus_string_get_length (&str) == (j - 1));
2841 _dbus_string_free (&str);
2846 /* Test appending data */
2847 if (!_dbus_string_init (&str, _DBUS_INT_MAX))
2848 _dbus_assert_not_reached ("failed to init string");
// Each round appends one byte via append and one via append_byte, so the length grows by two per round.
2853 if (!_dbus_string_append (&str, "a"))
2854 _dbus_assert_not_reached ("failed to append string to string\n");
2856 _dbus_assert (_dbus_string_get_length (&str) == i * 2 + 1);
2858 if (!_dbus_string_append_byte (&str, 'b'))
2859 _dbus_assert_not_reached ("failed to append byte to string\n");
2861 _dbus_assert (_dbus_string_get_length (&str) == i * 2 + 2);
2866 _dbus_string_free (&str);
2868 /* Check steal_data */
2870 if (!_dbus_string_init (&str, _DBUS_INT_MAX))
2871 _dbus_assert_not_reached ("failed to init string");
2873 if (!_dbus_string_append (&str, "Hello World"))
2874 _dbus_assert_not_reached ("could not append to string");
2876 i = _dbus_string_get_length (&str);
2878 if (!_dbus_string_steal_data (&str, &s))
2879 _dbus_assert_not_reached ("failed to steal data");
// After stealing, the string is empty and s holds the former contents.
2881 _dbus_assert (_dbus_string_get_length (&str) == 0);
2882 _dbus_assert (((int)strlen (s)) == i);
// Move section: the same text is moved into other at the start, at the end, and in the middle.
2888 if (!_dbus_string_append (&str, "Hello World"))
2889 _dbus_assert_not_reached ("could not append to string");
2891 i = _dbus_string_get_length (&str);
2893 if (!_dbus_string_init (&other, _DBUS_INT_MAX))
2894 _dbus_assert_not_reached ("could not init string");
2896 if (!_dbus_string_move (&str, 0, &other, 0))
2897 _dbus_assert_not_reached ("could not move");
2899 _dbus_assert (_dbus_string_get_length (&str) == 0);
2900 _dbus_assert (_dbus_string_get_length (&other) == i);
2902 if (!_dbus_string_append (&str, "Hello World"))
2903 _dbus_assert_not_reached ("could not append to string");
2905 if (!_dbus_string_move (&str, 0, &other, _dbus_string_get_length (&other)))
2906 _dbus_assert_not_reached ("could not move");
2908 _dbus_assert (_dbus_string_get_length (&str) == 0);
2909 _dbus_assert (_dbus_string_get_length (&other) == i * 2);
2911 if (!_dbus_string_append (&str, "Hello World"))
2912 _dbus_assert_not_reached ("could not append to string");
2914 if (!_dbus_string_move (&str, 0, &other, _dbus_string_get_length (&other) / 2))
2915 _dbus_assert_not_reached ("could not move");
2917 _dbus_assert (_dbus_string_get_length (&str) == 0);
2918 _dbus_assert (_dbus_string_get_length (&other) == i * 3);
2920 _dbus_string_free (&other);
// Copy section: same three insertion points, but the source keeps its contents.
2924 if (!_dbus_string_append (&str, "Hello World"))
2925 _dbus_assert_not_reached ("could not append to string");
2927 i = _dbus_string_get_length (&str);
2929 if (!_dbus_string_init (&other, _DBUS_INT_MAX))
2930 _dbus_assert_not_reached ("could not init string");
2932 if (!_dbus_string_copy (&str, 0, &other, 0))
2933 _dbus_assert_not_reached ("could not copy");
2935 _dbus_assert (_dbus_string_get_length (&str) == i);
2936 _dbus_assert (_dbus_string_get_length (&other) == i);
2938 if (!_dbus_string_copy (&str, 0, &other, _dbus_string_get_length (&other)))
2939 _dbus_assert_not_reached ("could not copy");
2941 _dbus_assert (_dbus_string_get_length (&str) == i);
2942 _dbus_assert (_dbus_string_get_length (&other) == i * 2);
2943 _dbus_assert (_dbus_string_equal_c_str (&other,
2944 "Hello WorldHello World"));
2946 if (!_dbus_string_copy (&str, 0, &other, _dbus_string_get_length (&other) / 2))
2947 _dbus_assert_not_reached ("could not copy");
2949 _dbus_assert (_dbus_string_get_length (&str) == i);
2950 _dbus_assert (_dbus_string_get_length (&other) == i * 3);
2951 _dbus_assert (_dbus_string_equal_c_str (&other,
2952 "Hello WorldHello WorldHello World"));
2954 _dbus_string_free (&str);
2955 _dbus_string_free (&other);
// Replace section: replace_len is exercised on an empty target, on a span in the middle, and on the final character.
2959 if (!_dbus_string_init (&str, _DBUS_INT_MAX))
2960 _dbus_assert_not_reached ("failed to init string");
2962 if (!_dbus_string_append (&str, "Hello World"))
2963 _dbus_assert_not_reached ("could not append to string");
2965 i = _dbus_string_get_length (&str);
2967 if (!_dbus_string_init (&other, _DBUS_INT_MAX))
2968 _dbus_assert_not_reached ("could not init string");
2970 if (!_dbus_string_replace_len (&str, 0, _dbus_string_get_length (&str),
2971 &other, 0, _dbus_string_get_length (&other)))
2972 _dbus_assert_not_reached ("could not replace");
2974 _dbus_assert (_dbus_string_get_length (&str) == i);
2975 _dbus_assert (_dbus_string_get_length (&other) == i);
2976 _dbus_assert (_dbus_string_equal_c_str (&other, "Hello World"));
2978 if (!_dbus_string_replace_len (&str, 0, _dbus_string_get_length (&str),
2980 _dbus_assert_not_reached ("could not replace center space");
2982 _dbus_assert (_dbus_string_get_length (&str) == i);
2983 _dbus_assert (_dbus_string_get_length (&other) == i * 2 - 1);
2984 _dbus_assert (_dbus_string_equal_c_str (&other,
2985 "HelloHello WorldWorld"));
2988 if (!_dbus_string_replace_len (&str, 1, 1,
2990 _dbus_string_get_length (&other) - 1,
2992 _dbus_assert_not_reached ("could not replace end character");
2994 _dbus_assert (_dbus_string_get_length (&str) == i);
2995 _dbus_assert (_dbus_string_get_length (&other) == i * 2 - 1);
2996 _dbus_assert (_dbus_string_equal_c_str (&other,
2997 "HelloHello WorldWorle"));
2999 _dbus_string_free (&str);
3000 _dbus_string_free (&other);
3002 /* Check append/get unichar */
3004 if (!_dbus_string_init (&str, _DBUS_INT_MAX))
3005 _dbus_assert_not_reached ("failed to init string");
3008 if (!_dbus_string_append_unichar (&str, 0xfffc))
3009 _dbus_assert_not_reached ("failed to append unichar");
3011 _dbus_string_get_unichar (&str, 0, &ch, &i);
// The character must come back unchanged and the reported end index must be the string length.
3013 _dbus_assert (ch == 0xfffc);
3014 _dbus_assert (i == _dbus_string_get_length (&str));
3016 _dbus_string_free (&str);
3018 /* Check insert/set/get byte */
3020 if (!_dbus_string_init (&str, _DBUS_INT_MAX))
3021 _dbus_assert_not_reached ("failed to init string");
3023 if (!_dbus_string_append (&str, "Hello"))
3024 _dbus_assert_not_reached ("failed to append Hello");
3026 _dbus_assert (_dbus_string_get_byte (&str, 0) == 'H');
3027 _dbus_assert (_dbus_string_get_byte (&str, 1) == 'e');
3028 _dbus_assert (_dbus_string_get_byte (&str, 2) == 'l');
3029 _dbus_assert (_dbus_string_get_byte (&str, 3) == 'l');
3030 _dbus_assert (_dbus_string_get_byte (&str, 4) == 'o');
3032 _dbus_string_set_byte (&str, 1, 'q');
3033 _dbus_assert (_dbus_string_get_byte (&str, 1) == 'q');
// Inserts at the front, in the middle and at the very end; the expected layout afterwards is 255 H Z q l l o W.
3035 if (!_dbus_string_insert_byte (&str, 0, 255))
3036 _dbus_assert_not_reached ("can't insert byte");
3038 if (!_dbus_string_insert_byte (&str, 2, 'Z'))
3039 _dbus_assert_not_reached ("can't insert byte");
3041 if (!_dbus_string_insert_byte (&str, _dbus_string_get_length (&str), 'W'))
3042 _dbus_assert_not_reached ("can't insert byte");
3044 _dbus_assert (_dbus_string_get_byte (&str, 0) == 255);
3045 _dbus_assert (_dbus_string_get_byte (&str, 1) == 'H');
3046 _dbus_assert (_dbus_string_get_byte (&str, 2) == 'Z');
3047 _dbus_assert (_dbus_string_get_byte (&str, 3) == 'q');
3048 _dbus_assert (_dbus_string_get_byte (&str, 4) == 'l');
3049 _dbus_assert (_dbus_string_get_byte (&str, 5) == 'l');
3050 _dbus_assert (_dbus_string_get_byte (&str, 6) == 'o');
3051 _dbus_assert (_dbus_string_get_byte (&str, 7) == 'W');
3053 _dbus_string_free (&str);
3055 /* Check append/parse int/double */
3057 if (!_dbus_string_init (&str, _DBUS_INT_MAX))
3058 _dbus_assert_not_reached ("failed to init string");
3060 if (!_dbus_string_append_int (&str, 27))
3061 _dbus_assert_not_reached ("failed to append int");
3063 i = _dbus_string_get_length (&str);
3065 if (!_dbus_string_parse_int (&str, 0, &v, &end))
3066 _dbus_assert_not_reached ("failed to parse int");
// Parsing must consume the whole string and return the value that was appended.
3068 _dbus_assert (v == 27);
3069 _dbus_assert (end == i);
3071 _dbus_string_free (&str);
3073 if (!_dbus_string_init (&str, _DBUS_INT_MAX))
3074 _dbus_assert_not_reached ("failed to init string");
3076 if (!_dbus_string_append_double (&str, 50.3))
3077 _dbus_assert_not_reached ("failed to append float");
3079 i = _dbus_string_get_length (&str);
3081 if (!_dbus_string_parse_double (&str, 0, &d, &end))
3082 _dbus_assert_not_reached ("failed to parse float");
// The double is compared with a tolerance of 1e-6 rather than for exact equality.
3084 _dbus_assert (d > (50.3 - 1e-6) && d < (50.3 + 1e-6));
3085 _dbus_assert (end == i);
3087 _dbus_string_free (&str);
// Find section: substrings of "Hello" that must be found (with their index), then ones that must not be.
3090 if (!_dbus_string_init (&str, _DBUS_INT_MAX))
3091 _dbus_assert_not_reached ("failed to init string");
3093 if (!_dbus_string_append (&str, "Hello"))
3094 _dbus_assert_not_reached ("couldn't append to string");
3096 if (!_dbus_string_find (&str, 0, "He", &i))
3097 _dbus_assert_not_reached ("didn't find 'He'");
3098 _dbus_assert (i == 0);
3100 if (!_dbus_string_find (&str, 0, "Hello", &i))
3101 _dbus_assert_not_reached ("didn't find 'Hello'");
3102 _dbus_assert (i == 0);
3104 if (!_dbus_string_find (&str, 0, "ello", &i))
3105 _dbus_assert_not_reached ("didn't find 'ello'");
3106 _dbus_assert (i == 1);
3108 if (!_dbus_string_find (&str, 0, "lo", &i))
3109 _dbus_assert_not_reached ("didn't find 'lo'");
3110 _dbus_assert (i == 3);
3112 if (!_dbus_string_find (&str, 2, "lo", &i))
3113 _dbus_assert_not_reached ("didn't find 'lo'");
3114 _dbus_assert (i == 3);
// Starting at index 4 leaves only "o", so "lo" must not be found.
3116 if (_dbus_string_find (&str, 4, "lo", &i))
3117 _dbus_assert_not_reached ("did find 'lo'");
3119 if (!_dbus_string_find (&str, 0, "l", &i))
3120 _dbus_assert_not_reached ("didn't find 'l'");
3121 _dbus_assert (i == 2);
3123 if (!_dbus_string_find (&str, 0, "H", &i))
3124 _dbus_assert_not_reached ("didn't find 'H'");
3125 _dbus_assert (i == 0);
// The empty substring is expected to be found at the start index.
3127 if (!_dbus_string_find (&str, 0, "", &i))
3128 _dbus_assert_not_reached ("didn't find ''");
3129 _dbus_assert (i == 0);
3131 if (_dbus_string_find (&str, 0, "Hello!", NULL))
3132 _dbus_assert_not_reached ("Did find 'Hello!'");
3134 if (_dbus_string_find (&str, 0, "Oh, Hello", NULL))
3135 _dbus_assert_not_reached ("Did find 'Oh, Hello'");
3137 if (_dbus_string_find (&str, 0, "ill", NULL))
3138 _dbus_assert_not_reached ("Did find 'ill'");
3140 if (_dbus_string_find (&str, 0, "q", NULL))
3141 _dbus_assert_not_reached ("Did find 'q'");
// With the search limited to the first two bytes, "He" fits but "Hello" does not.
3143 if (!_dbus_string_find_to (&str, 0, 2, "He", NULL))
3144 _dbus_assert_not_reached ("Didn't find 'He'");
3146 if (_dbus_string_find_to (&str, 0, 2, "Hello", NULL))
3147 _dbus_assert_not_reached ("Did find 'Hello'");
3149 _dbus_string_free (&str);
3151 /* Base 64 and Hex encoding */
3152 test_roundtrips (test_base64_roundtrip);
3153 test_roundtrips (test_hex_roundtrip);
3158 #endif /* DBUS_BUILD_TESTS */