1 /* GLIB - Library of useful routines for C programming
2 * Copyright (C) 1995-1997 Peter Mattis, Spencer Kimball and Josh MacDonald
4 * This library is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public
6 * License as published by the Free Software Foundation; either
7 * version 2.1 of the License, or (at your option) any later version.
9 * This library is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
19 * Modified by the GLib Team and others 1997-2000. See the AUTHORS
20 * file for a list of people on the GLib Team. See the ChangeLog
21 * files for a list of changes. These files are distributed with
22 * GLib at ftp://ftp.gtk.org/pub/gtk/.
45 * @short_description: text buffers which grow automatically
48 * A #GString is an object that handles the memory management of a C
49 * string for you. The emphasis of #GString is on text, typically
50 * UTF-8. Crucially, the "str" member of a #GString is guaranteed to
51 * have a trailing nul character, and it is therefore always safe to
52 * call functions such as strchr() or g_strdup() on it.
54 * However, a #GString can also hold arbitrary binary data, because it
55 * has a "len" member, which includes any possible embedded nul
56 * characters in the data. Conceptually then, #GString is like a
57 * #GByteArray with the addition of many convenience methods for text,
58 * and a guaranteed nul terminator.
63 * @str: points to the character data. It may move as text is added.
64 * The @str field is nul-terminated and so
65 * can be used as an ordinary C string.
66 * @len: contains the length of the string, not including the
67 * terminating nul byte.
68 * @allocated_len: the number of bytes that can be stored in the
69 * string before it needs to be reallocated. May be larger than @len.
71 * The GString struct contains the public fields of a GString.
75 #define MY_MAXSIZE ((gsize)-1)
78 nearest_power (gsize base
, gsize num
)
80 if (num
> MY_MAXSIZE
/ 2)
96 g_string_maybe_expand (GString
*string
,
99 if (string
->len
+ len
>= string
->allocated_len
)
101 string
->allocated_len
= nearest_power (1, string
->len
+ len
+ 1);
102 string
->str
= g_realloc (string
->str
, string
->allocated_len
);
107 * g_string_sized_new:
108 * @dfl_size: the default size of the space allocated to
111 * Creates a new #GString, with enough space for @dfl_size
112 * bytes. This is useful if you are going to add a lot of
113 * text to the string and don't want it to be reallocated
116 * Returns: the new #GString
119 g_string_sized_new (gsize dfl_size
)
121 GString
*string
= g_slice_new (GString
);
123 string
->allocated_len
= 0;
127 g_string_maybe_expand (string
, MAX (dfl_size
, 2));
135 * @init: (nullable): the initial text to copy into the string, or %NULL to
136 * start with an empty string
138 * Creates a new #GString, initialized with the given string.
140 * Returns: the new #GString
143 g_string_new (const gchar
*init
)
147 if (init
== NULL
|| *init
== '\0')
148 string
= g_string_sized_new (2);
154 string
= g_string_sized_new (len
+ 2);
156 g_string_append_len (string
, init
, len
);
164 * @init: initial contents of the string
165 * @len: length of @init to use
167 * Creates a new #GString with @len bytes of the @init buffer.
168 * Because a length is provided, @init need not be nul-terminated,
169 * and can contain embedded nul bytes.
171 * Since this function does not stop at nul bytes, it is the caller's
172 * responsibility to ensure that @init has at least @len addressable
175 * Returns: a new #GString
178 g_string_new_len (const gchar
*init
,
184 return g_string_new (init
);
187 string
= g_string_sized_new (len
);
190 g_string_append_len (string
, init
, len
);
198 * @string: (transfer full): a #GString
199 * @free_segment: if %TRUE, the actual character data is freed as well
201 * Frees the memory allocated for the #GString.
202 * If @free_segment is %TRUE it also frees the character data. If
203 * it's %FALSE, the caller gains ownership of the buffer and must
204 * free it after use with g_free().
206 * Returns: (nullable): the character data of @string
207 * (i.e. %NULL if @free_segment is %TRUE)
210 g_string_free (GString
*string
,
211 gboolean free_segment
)
215 g_return_val_if_fail (string
!= NULL
, NULL
);
219 g_free (string
->str
);
223 segment
= string
->str
;
225 g_slice_free (GString
, string
);
231 * g_string_free_to_bytes:
232 * @string: (transfer full): a #GString
234 * Transfers ownership of the contents of @string to a newly allocated
235 * #GBytes. The #GString structure itself is deallocated, and it is
236 * therefore invalid to use @string after invoking this function.
238 * Note that while #GString ensures that its buffer always has a
239 * trailing nul character (not reflected in its "len"), the returned
240 * #GBytes does not include this extra nul; i.e. it has length exactly
241 * equal to the "len" member.
243 * Returns: (transfer full): A newly allocated #GBytes containing contents of @string; @string itself is freed
247 g_string_free_to_bytes (GString
*string
)
252 g_return_val_if_fail (string
!= NULL
, NULL
);
256 buf
= g_string_free (string
, FALSE
);
258 return g_bytes_new_take (buf
, len
);
264 * @v2: another #GString
266 * Compares two strings for equality, returning %TRUE if they are equal.
267 * For use with #GHashTable.
269 * Returns: %TRUE if the strings are the same length and contain the
273 g_string_equal (const GString
*v
,
277 GString
*string1
= (GString
*) v
;
278 GString
*string2
= (GString
*) v2
;
279 gsize i
= string1
->len
;
281 if (i
!= string2
->len
)
299 * @str: a string to hash
301 * Creates a hash code for @str; for use with #GHashTable.
303 * Returns: hash code for @str
306 g_string_hash (const GString
*str
)
308 const gchar
*p
= str
->str
;
312 /* 31 bit hash function */
315 h
= (h
<< 5) - h
+ *p
;
324 * @string: the destination #GString. Its current contents
326 * @rval: the string to copy into @string
328 * Copies the bytes from a string into a #GString,
329 * destroying any previous contents. It is rather like
330 * the standard strcpy() function, except that you do not
331 * have to worry about having enough space to copy the string.
333 * Returns: (transfer none): @string
336 g_string_assign (GString
*string
,
339 g_return_val_if_fail (string
!= NULL
, NULL
);
340 g_return_val_if_fail (rval
!= NULL
, string
);
342 /* Make sure assigning to itself doesn't corrupt the string. */
343 if (string
->str
!= rval
)
345 /* Assigning from substring should be ok, since
346 * g_string_truncate() does not reallocate.
348 g_string_truncate (string
, 0);
349 g_string_append (string
, rval
);
357 * @string: a #GString
358 * @len: the new size of @string
360 * Cuts off the end of the GString, leaving the first @len bytes.
362 * Returns: (transfer none): @string
365 g_string_truncate (GString
*string
,
368 g_return_val_if_fail (string
!= NULL
, NULL
);
370 string
->len
= MIN (len
, string
->len
);
371 string
->str
[string
->len
] = 0;
378 * @string: a #GString
379 * @len: the new length
381 * Sets the length of a #GString. If the length is less than
382 * the current length, the string will be truncated. If the
383 * length is greater than the current length, the contents
384 * of the newly added area are undefined. (However, as
385 * always, string->str[string->len] will be a nul byte.)
387 * Returns: (transfer none): @string
390 g_string_set_size (GString
*string
,
393 g_return_val_if_fail (string
!= NULL
, NULL
);
395 if (len
>= string
->allocated_len
)
396 g_string_maybe_expand (string
, len
- string
->len
);
399 string
->str
[len
] = 0;
405 * g_string_insert_len:
406 * @string: a #GString
407 * @pos: position in @string where insertion should
408 * happen, or -1 for at the end
409 * @val: bytes to insert
410 * @len: number of bytes of @val to insert
412 * Inserts @len bytes of @val into @string at @pos.
413 * Because @len is provided, @val may contain embedded
414 * nuls and need not be nul-terminated. If @pos is -1,
415 * bytes are inserted at the end of the string.
417 * Since this function does not stop at nul bytes, it is
418 * the caller's responsibility to ensure that @val has at
419 * least @len addressable bytes.
421 * Returns: (transfer none): @string
424 g_string_insert_len (GString
*string
,
429 g_return_val_if_fail (string
!= NULL
, NULL
);
430 g_return_val_if_fail (len
== 0 || val
!= NULL
, string
);
441 g_return_val_if_fail (pos
<= string
->len
, string
);
443 /* Check whether val represents a substring of string.
444 * This test probably violates chapter and verse of the C standards,
445 * since ">=" and "<=" are only valid when val really is a substring.
446 * In practice, it will work on modern archs.
448 if (G_UNLIKELY (val
>= string
->str
&& val
<= string
->str
+ string
->len
))
450 gsize offset
= val
- string
->str
;
453 g_string_maybe_expand (string
, len
);
454 val
= string
->str
+ offset
;
455 /* At this point, val is valid again. */
457 /* Open up space where we are going to insert. */
458 if (pos
< string
->len
)
459 memmove (string
->str
+ pos
+ len
, string
->str
+ pos
, string
->len
- pos
);
461 /* Move the source part before the gap, if any. */
464 precount
= MIN (len
, pos
- offset
);
465 memcpy (string
->str
+ pos
, val
, precount
);
468 /* Move the source part after the gap, if any. */
470 memcpy (string
->str
+ pos
+ precount
,
471 val
+ /* Already moved: */ precount
+ /* Space opened up: */ len
,
476 g_string_maybe_expand (string
, len
);
478 /* If we aren't appending at the end, move a hunk
479 * of the old string to the end, opening up space
481 if (pos
< string
->len
)
482 memmove (string
->str
+ pos
+ len
, string
->str
+ pos
, string
->len
- pos
);
484 /* insert the new string */
486 string
->str
[pos
] = *val
;
488 memcpy (string
->str
+ pos
, val
, len
);
493 string
->str
[string
->len
] = 0;
498 #define SUB_DELIM_CHARS "!$&'()*+,;="
502 const char *reserved_chars_allowed
)
504 if (g_ascii_isalnum (c
) ||
511 if (reserved_chars_allowed
&&
512 strchr (reserved_chars_allowed
, c
) != NULL
)
519 gunichar_ok (gunichar c
)
522 (c
!= (gunichar
) -2) &&
523 (c
!= (gunichar
) -1);
527 * g_string_append_uri_escaped:
528 * @string: a #GString
529 * @unescaped: a string
530 * @reserved_chars_allowed: a string of reserved characters allowed
531 * to be used, or %NULL
532 * @allow_utf8: set %TRUE if the escaped string may include UTF8 characters
534 * Appends @unescaped to @string, escaping any characters that
535 * are reserved in URIs using URI-style escape sequences.
537 * Returns: (transfer none): @string
542 g_string_append_uri_escaped (GString
*string
,
543 const gchar
*unescaped
,
544 const gchar
*reserved_chars_allowed
,
549 static const gchar hex
[16] = "0123456789ABCDEF";
551 g_return_val_if_fail (string
!= NULL
, NULL
);
552 g_return_val_if_fail (unescaped
!= NULL
, NULL
);
554 end
= unescaped
+ strlen (unescaped
);
556 while ((c
= *unescaped
) != 0)
558 if (c
>= 0x80 && allow_utf8
&&
559 gunichar_ok (g_utf8_get_char_validated (unescaped
, end
- unescaped
)))
561 int len
= g_utf8_skip
[c
];
562 g_string_append_len (string
, unescaped
, len
);
565 else if (is_valid (c
, reserved_chars_allowed
))
567 g_string_append_c (string
, c
);
572 g_string_append_c (string
, '%');
573 g_string_append_c (string
, hex
[((guchar
)c
) >> 4]);
574 g_string_append_c (string
, hex
[((guchar
)c
) & 0xf]);
584 * @string: a #GString
585 * @val: the string to append onto the end of @string
587 * Adds a string onto the end of a #GString, expanding
590 * Returns: (transfer none): @string
593 g_string_append (GString
*string
,
596 return g_string_insert_len (string
, -1, val
, -1);
600 * g_string_append_len:
601 * @string: a #GString
602 * @val: bytes to append
603 * @len: number of bytes of @val to use
605 * Appends @len bytes of @val to @string. Because @len is
606 * provided, @val may contain embedded nuls and need not
609 * Since this function does not stop at nul bytes, it is
610 * the caller's responsibility to ensure that @val has at
611 * least @len addressable bytes.
613 * Returns: (transfer none): @string
616 g_string_append_len (GString
*string
,
620 return g_string_insert_len (string
, -1, val
, len
);
625 * @string: a #GString
626 * @c: the byte to append onto the end of @string
628 * Adds a byte onto the end of a #GString, expanding
631 * Returns: (transfer none): @string
633 #undef g_string_append_c
635 g_string_append_c (GString
*string
,
638 g_return_val_if_fail (string
!= NULL
, NULL
);
640 return g_string_insert_c (string
, -1, c
);
644 * g_string_append_unichar:
645 * @string: a #GString
646 * @wc: a Unicode character
648 * Converts a Unicode character into UTF-8, and appends it
651 * Returns: (transfer none): @string
654 g_string_append_unichar (GString
*string
,
657 g_return_val_if_fail (string
!= NULL
, NULL
);
659 return g_string_insert_unichar (string
, -1, wc
);
664 * @string: a #GString
665 * @val: the string to prepend on the start of @string
667 * Adds a string on to the start of a #GString,
668 * expanding it if necessary.
670 * Returns: (transfer none): @string
673 g_string_prepend (GString
*string
,
676 return g_string_insert_len (string
, 0, val
, -1);
680 * g_string_prepend_len:
681 * @string: a #GString
682 * @val: bytes to prepend
683 * @len: number of bytes in @val to prepend
685 * Prepends @len bytes of @val to @string.
686 * Because @len is provided, @val may contain
687 * embedded nuls and need not be nul-terminated.
689 * Since this function does not stop at nul bytes,
690 * it is the caller's responsibility to ensure that
691 * @val has at least @len addressable bytes.
693 * Returns: (transfer none): @string
696 g_string_prepend_len (GString
*string
,
700 return g_string_insert_len (string
, 0, val
, len
);
704 * g_string_prepend_c:
705 * @string: a #GString
706 * @c: the byte to prepend on the start of the #GString
708 * Adds a byte onto the start of a #GString,
709 * expanding it if necessary.
711 * Returns: (transfer none): @string
714 g_string_prepend_c (GString
*string
,
717 g_return_val_if_fail (string
!= NULL
, NULL
);
719 return g_string_insert_c (string
, 0, c
);
723 * g_string_prepend_unichar:
724 * @string: a #GString
725 * @wc: a Unicode character
727 * Converts a Unicode character into UTF-8, and prepends it
730 * Returns: (transfer none): @string
733 g_string_prepend_unichar (GString
*string
,
736 g_return_val_if_fail (string
!= NULL
, NULL
);
738 return g_string_insert_unichar (string
, 0, wc
);
743 * @string: a #GString
744 * @pos: the position to insert the copy of the string
745 * @val: the string to insert
747 * Inserts a copy of a string into a #GString,
748 * expanding it if necessary.
750 * Returns: (transfer none): @string
753 g_string_insert (GString
*string
,
757 return g_string_insert_len (string
, pos
, val
, -1);
762 * @string: a #GString
763 * @pos: the position to insert the byte
764 * @c: the byte to insert
766 * Inserts a byte into a #GString, expanding it if necessary.
768 * Returns: (transfer none): @string
771 g_string_insert_c (GString
*string
,
775 g_return_val_if_fail (string
!= NULL
, NULL
);
777 g_string_maybe_expand (string
, 1);
782 g_return_val_if_fail (pos
<= string
->len
, string
);
784 /* If not just an append, move the old stuff */
785 if (pos
< string
->len
)
786 memmove (string
->str
+ pos
+ 1, string
->str
+ pos
, string
->len
- pos
);
788 string
->str
[pos
] = c
;
792 string
->str
[string
->len
] = 0;
798 * g_string_insert_unichar:
799 * @string: a #GString
800 * @pos: the position at which to insert character, or -1
801 * to append at the end of the string
802 * @wc: a Unicode character
804 * Converts a Unicode character into UTF-8, and inserts it
805 * into the string at the given position.
807 * Returns: (transfer none): @string
810 g_string_insert_unichar (GString
*string
,
814 gint charlen
, first
, i
;
817 g_return_val_if_fail (string
!= NULL
, NULL
);
819 /* Code copied from g_unichar_to_utf8() */
830 else if (wc
< 0x10000)
835 else if (wc
< 0x200000)
840 else if (wc
< 0x4000000)
850 /* End of copied code */
852 g_string_maybe_expand (string
, charlen
);
857 g_return_val_if_fail (pos
<= string
->len
, string
);
859 /* If not just an append, move the old stuff */
860 if (pos
< string
->len
)
861 memmove (string
->str
+ pos
+ charlen
, string
->str
+ pos
, string
->len
- pos
);
863 dest
= string
->str
+ pos
;
864 /* Code copied from g_unichar_to_utf8() */
865 for (i
= charlen
- 1; i
> 0; --i
)
867 dest
[i
] = (wc
& 0x3f) | 0x80;
870 dest
[0] = wc
| first
;
871 /* End of copied code */
873 string
->len
+= charlen
;
875 string
->str
[string
->len
] = 0;
881 * g_string_overwrite:
882 * @string: a #GString
883 * @pos: the position at which to start overwriting
884 * @val: the string that will overwrite the @string starting at @pos
886 * Overwrites part of a string, lengthening it if necessary.
888 * Returns: (transfer none): @string
893 g_string_overwrite (GString
*string
,
897 g_return_val_if_fail (val
!= NULL
, string
);
898 return g_string_overwrite_len (string
, pos
, val
, strlen (val
));
902 * g_string_overwrite_len:
903 * @string: a #GString
904 * @pos: the position at which to start overwriting
905 * @val: the string that will overwrite the @string starting at @pos
906 * @len: the number of bytes to write from @val
908 * Overwrites part of a string, lengthening it if necessary.
909 * This function will work with embedded nuls.
911 * Returns: (transfer none): @string
916 g_string_overwrite_len (GString
*string
,
923 g_return_val_if_fail (string
!= NULL
, NULL
);
928 g_return_val_if_fail (val
!= NULL
, string
);
929 g_return_val_if_fail (pos
<= string
->len
, string
);
936 if (end
> string
->len
)
937 g_string_maybe_expand (string
, end
- string
->len
);
939 memcpy (string
->str
+ pos
, val
, len
);
941 if (end
> string
->len
)
943 string
->str
[end
] = '\0';
952 * @string: a #GString
953 * @pos: the position of the content to remove
954 * @len: the number of bytes to remove, or -1 to remove all
957 * Removes @len bytes from a #GString, starting at position @pos.
958 * The rest of the #GString is shifted down to fill the gap.
960 * Returns: (transfer none): @string
963 g_string_erase (GString
*string
,
967 g_return_val_if_fail (string
!= NULL
, NULL
);
968 g_return_val_if_fail (pos
>= 0, string
);
969 g_return_val_if_fail (pos
<= string
->len
, string
);
972 len
= string
->len
- pos
;
975 g_return_val_if_fail (pos
+ len
<= string
->len
, string
);
977 if (pos
+ len
< string
->len
)
978 memmove (string
->str
+ pos
, string
->str
+ pos
+ len
, string
->len
- (pos
+ len
));
983 string
->str
[string
->len
] = 0;
989 * g_string_ascii_down:
992 * Converts all uppercase ASCII letters to lowercase ASCII letters.
994 * Returns: (transfer none): passed-in @string pointer, with all the
995 * uppercase characters converted to lowercase in place,
996 * with semantics that exactly match g_ascii_tolower().
999 g_string_ascii_down (GString
*string
)
1004 g_return_val_if_fail (string
!= NULL
, NULL
);
1011 *s
= g_ascii_tolower (*s
);
1020 * g_string_ascii_up:
1021 * @string: a #GString
1023 * Converts all lowercase ASCII letters to uppercase ASCII letters.
1025 * Returns: (transfer none): passed-in @string pointer, with all the
1026 * lowercase characters converted to uppercase in place,
1027 * with semantics that exactly match g_ascii_toupper().
1030 g_string_ascii_up (GString
*string
)
1035 g_return_val_if_fail (string
!= NULL
, NULL
);
1042 *s
= g_ascii_toupper (*s
);
1052 * @string: a #GString
1054 * Converts a #GString to lowercase.
1056 * Returns: (transfer none): the #GString
1058 * Deprecated:2.2: This function uses the locale-specific
1059 * tolower() function, which is almost never the right thing.
1060 * Use g_string_ascii_down() or g_utf8_strdown() instead.
1063 g_string_down (GString
*string
)
1068 g_return_val_if_fail (string
!= NULL
, NULL
);
1071 s
= (guchar
*) string
->str
;
1086 * @string: a #GString
1088 * Converts a #GString to uppercase.
1090 * Returns: (transfer none): @string
1092 * Deprecated:2.2: This function uses the locale-specific
1093 * toupper() function, which is almost never the right thing.
1094 * Use g_string_ascii_up() or g_utf8_strup() instead.
1097 g_string_up (GString
*string
)
1102 g_return_val_if_fail (string
!= NULL
, NULL
);
1105 s
= (guchar
*) string
->str
;
1119 * g_string_append_vprintf:
1120 * @string: a #GString
1121 * @format: the string format. See the printf() documentation
1122 * @args: the list of arguments to insert in the output
1124 * Appends a formatted string onto the end of a #GString.
1125 * This function is similar to g_string_append_printf()
1126 * except that the arguments to the format string are passed
1132 g_string_append_vprintf (GString
*string
,
1133 const gchar
*format
,
1139 g_return_if_fail (string
!= NULL
);
1140 g_return_if_fail (format
!= NULL
);
1142 len
= g_vasprintf (&buf
, format
, args
);
1146 g_string_maybe_expand (string
, len
);
1147 memcpy (string
->str
+ string
->len
, buf
, len
+ 1);
1155 * @string: a #GString
1156 * @format: the string format. See the printf() documentation
1157 * @args: the parameters to insert into the format string
1159 * Writes a formatted string into a #GString.
1160 * This function is similar to g_string_printf() except that
1161 * the arguments to the format string are passed as a va_list.
1166 g_string_vprintf (GString
*string
,
1167 const gchar
*format
,
1170 g_string_truncate (string
, 0);
1171 g_string_append_vprintf (string
, format
, args
);
1176 * @string: a #GString
1177 * @format: the string format. See the sprintf() documentation
1178 * @...: the parameters to insert into the format string
1180 * Writes a formatted string into a #GString.
1181 * This is similar to the standard sprintf() function,
1182 * except that the #GString buffer automatically expands
1183 * to contain the results. The previous contents of the
1184 * #GString are destroyed.
1186 * Deprecated: This function has been renamed to g_string_printf().
1191 * @string: a #GString
1192 * @format: the string format. See the printf() documentation
1193 * @...: the parameters to insert into the format string
1195 * Writes a formatted string into a #GString.
1196 * This is similar to the standard sprintf() function,
1197 * except that the #GString buffer automatically expands
1198 * to contain the results. The previous contents of the
1199 * #GString are destroyed.
1202 g_string_printf (GString
*string
,
1203 const gchar
*format
,
1208 g_string_truncate (string
, 0);
1210 va_start (args
, format
);
1211 g_string_append_vprintf (string
, format
, args
);
1216 * g_string_sprintfa:
1217 * @string: a #GString
1218 * @format: the string format. See the sprintf() documentation
1219 * @...: the parameters to insert into the format string
1221 * Appends a formatted string onto the end of a #GString.
1222 * This function is similar to g_string_sprintf() except that
1223 * the text is appended to the #GString.
1225 * Deprecated: This function has been renamed to g_string_append_printf().
1229 * g_string_append_printf:
1230 * @string: a #GString
1231 * @format: the string format. See the printf() documentation
1232 * @...: the parameters to insert into the format string
1234 * Appends a formatted string onto the end of a #GString.
1235 * This function is similar to g_string_printf() except
1236 * that the text is appended to the #GString.
1239 g_string_append_printf (GString
*string
,
1240 const gchar
*format
,
1245 va_start (args
, format
);
1246 g_string_append_vprintf (string
, format
, args
);