glib/gstrfuncs.c

   1 /* GLIB - Library of useful routines for C programming
   2  * Copyright (C) 1995-1997  Peter Mattis, Spencer Kimball and Josh MacDonald
   3  *
   4  * This library is free software; you can redistribute it and/or
   5  * modify it under the terms of the GNU Lesser General Public
   6  * License as published by the Free Software Foundation; either
   7  * version 2 of the License, or (at your option) any later version.
   8  *
   9  * This library is distributed in the hope that it will be useful,
  10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  12  * Lesser General Public License for more details.
  13  *
  14  * You should have received a copy of the GNU Lesser General Public
  15  * License along with this library; if not, see <http://www.gnu.org/licenses/>.
  16  */
  17
  18 /*
  19  * Modified by the GLib Team and others 1997-2000.  See the AUTHORS
  20  * file for a list of people on the GLib Team.  See the ChangeLog
  21  * files for a list of changes.  These files are distributed with
  22  * GLib at ftp://ftp.gtk.org/pub/gtk/.
  23  */
  24
  25 /*
  26  * MT safe
  27  */
  28
  29 #include "config.h"
  30
  31 #include <stdarg.h>
  32 #include <stdio.h>
  33 #include <stdlib.h>
  34 #include <locale.h>
  35 #include <string.h>
  36 #include <locale.h>
  37 #include <errno.h>
  38 #include <ctype.h>              /* For tolower() */
  39
  40 #ifdef HAVE_XLOCALE_H
  41 /* Needed on BSD/OS X for e.g. strtod_l */
  42 #include <xlocale.h>
  43 #endif
  44
  45 #ifdef G_OS_WIN32
  46 #include <windows.h>
  47 #endif
  48
  49 /* do not include <unistd.h> here, it may interfere with g_strsignal() */
  50
  51 #include "gstrfuncs.h"
  52
  53 #include "gprintf.h"
  54 #include "gprintfint.h"
  55 #include "glibintl.h"
  56
  57
  58 /**
  59  * SECTION:string_utils
  60  * @title: String Utility Functions
  61  * @short_description: various string-related functions
  62  *
  63  * This section describes a number of utility functions for creating,
  64  * duplicating, and manipulating strings.
  65  *
  66  * Note that the functions g_printf(), g_fprintf(), g_sprintf(),
  67  * g_snprintf(), g_vprintf(), g_vfprintf(), g_vsprintf() and g_vsnprintf()
  68  * are declared in the header `gprintf.h` which is not included in `glib.h`
  69  * (otherwise using `glib.h` would drag in `stdio.h`), so you'll have to
  70  * explicitly include `<glib/gprintf.h>` in order to use the GLib
  71  * printf() functions.
  72  *
  73  * ## String precision pitfalls # {#string-precision}
  74  *
  75  * While you may use the printf() functions to format UTF-8 strings,
  76  * notice that the precision of a \%Ns parameter is interpreted
  77  * as the number of bytes, not characters to print. On top of that,
  78  * the GNU libc implementation of the printf() functions has the
  79  * "feature" that it checks that the string given for the \%Ns
  80  * parameter consists of a whole number of characters in the current
  81  * encoding. So, unless you are sure you are always going to be in an
  82  * UTF-8 locale or your know your text is restricted to ASCII, avoid
  83  * using \%Ns. If your intention is to format strings for a
  84  * certain number of columns, then \%Ns is not a correct solution
  85  * anyway, since it fails to take wide characters (see g_unichar_iswide())
  86  * into account.
  87  */
  88
  89 /**
  90  * g_ascii_isalnum:
  91  * @c: any character
  92  *
  93  * Determines whether a character is alphanumeric.
  94  *
  95  * Unlike the standard C library isalnum() function, this only
  96  * recognizes standard ASCII letters and ignores the locale,
  97  * returning %FALSE for all non-ASCII characters. Also, unlike
  98  * the standard library function, this takes a char, not an int,
  99  * so don't call it on %EOF, but no need to cast to #guchar before
 100  * passing a possibly non-ASCII character in.
 101  *
 102  * Returns: %TRUE if @c is an ASCII alphanumeric character
 103  */
 104
 105 /**
 106  * g_ascii_isalpha:
 107  * @c: any character
 108  *
 109  * Determines whether a character is alphabetic (i.e. a letter).
 110  *
 111  * Unlike the standard C library isalpha() function, this only
 112  * recognizes standard ASCII letters and ignores the locale,
 113  * returning %FALSE for all non-ASCII characters. Also, unlike
 114  * the standard library function, this takes a char, not an int,
 115  * so don't call it on %EOF, but no need to cast to #guchar before
 116  * passing a possibly non-ASCII character in.
 117  *
 118  * Returns: %TRUE if @c is an ASCII alphabetic character
 119  */
 120
 121 /**
 122  * g_ascii_iscntrl:
 123  * @c: any character
 124  *
 125  * Determines whether a character is a control character.
 126  *
 127  * Unlike the standard C library iscntrl() function, this only
 128  * recognizes standard ASCII control characters and ignores the
 129  * locale, returning %FALSE for all non-ASCII characters. Also,
 130  * unlike the standard library function, this takes a char, not
 131  * an int, so don't call it on %EOF, but no need to cast to #guchar
 132  * before passing a possibly non-ASCII character in.
 133  *
 134  * Returns: %TRUE if @c is an ASCII control character.
 135  */
 136
 137 /**
 138  * g_ascii_isdigit:
 139  * @c: any character
 140  *
 141  * Determines whether a character is digit (0-9).
 142  *
 143  * Unlike the standard C library isdigit() function, this takes
 144  * a char, not an int, so don't call it  on %EOF, but no need to
 145  * cast to #guchar before passing a possibly non-ASCII character in.
 146  *
 147  * Returns: %TRUE if @c is an ASCII digit.
 148  */
 149
 150 /**
 151  * g_ascii_isgraph:
 152  * @c: any character
 153  *
 154  * Determines whether a character is a printing character and not a space.
 155  *
 156  * Unlike the standard C library isgraph() function, this only
 157  * recognizes standard ASCII characters and ignores the locale,
 158  * returning %FALSE for all non-ASCII characters. Also, unlike
 159  * the standard library function, this takes a char, not an int,
 160  * so don't call it on %EOF, but no need to cast to #guchar before
 161  * passing a possibly non-ASCII character in.
 162  *
 163  * Returns: %TRUE if @c is an ASCII printing character other than space.
 164  */
 165
 166 /**
 167  * g_ascii_islower:
 168  * @c: any character
 169  *
 170  * Determines whether a character is an ASCII lower case letter.
 171  *
 172  * Unlike the standard C library islower() function, this only
 173  * recognizes standard ASCII letters and ignores the locale,
 174  * returning %FALSE for all non-ASCII characters. Also, unlike
 175  * the standard library function, this takes a char, not an int,
 176  * so don't call it on %EOF, but no need to worry about casting
 177  * to #guchar before passing a possibly non-ASCII character in.
 178  *
 179  * Returns: %TRUE if @c is an ASCII lower case letter
 180  */
 181
 182 /**
 183  * g_ascii_isprint:
 184  * @c: any character
 185  *
 186  * Determines whether a character is a printing character.
 187  *
 188  * Unlike the standard C library isprint() function, this only
 189  * recognizes standard ASCII characters and ignores the locale,
 190  * returning %FALSE for all non-ASCII characters. Also, unlike
 191  * the standard library function, this takes a char, not an int,
 192  * so don't call it on %EOF, but no need to cast to #guchar before
 193  * passing a possibly non-ASCII character in.
 194  *
 195  * Returns: %TRUE if @c is an ASCII printing character.
 196  */
 197
 198 /**
 199  * g_ascii_ispunct:
 200  * @c: any character
 201  *
 202  * Determines whether a character is a punctuation character.
 203  *
 204  * Unlike the standard C library ispunct() function, this only
 205  * recognizes standard ASCII letters and ignores the locale,
 206  * returning %FALSE for all non-ASCII characters. Also, unlike
 207  * the standard library function, this takes a char, not an int,
 208  * so don't call it on %EOF, but no need to cast to #guchar before
 209  * passing a possibly non-ASCII character in.
 210  *
 211  * Returns: %TRUE if @c is an ASCII punctuation character.
 212  */
 213
 214 /**
 215  * g_ascii_isspace:
 216  * @c: any character
 217  *
 218  * Determines whether a character is a white-space character.
 219  *
 220  * Unlike the standard C library isspace() function, this only
 221  * recognizes standard ASCII white-space and ignores the locale,
 222  * returning %FALSE for all non-ASCII characters. Also, unlike
 223  * the standard library function, this takes a char, not an int,
 224  * so don't call it on %EOF, but no need to cast to #guchar before
 225  * passing a possibly non-ASCII character in.
 226  *
 227  * Returns: %TRUE if @c is an ASCII white-space character
 228  */
 229
 230 /**
 231  * g_ascii_isupper:
 232  * @c: any character
 233  *
 234  * Determines whether a character is an ASCII upper case letter.
 235  *
 236  * Unlike the standard C library isupper() function, this only
 237  * recognizes standard ASCII letters and ignores the locale,
 238  * returning %FALSE for all non-ASCII characters. Also, unlike
 239  * the standard library function, this takes a char, not an int,
 240  * so don't call it on %EOF, but no need to worry about casting
 241  * to #guchar before passing a possibly non-ASCII character in.
 242  *
 243  * Returns: %TRUE if @c is an ASCII upper case letter
 244  */
 245
 246 /**
 247  * g_ascii_isxdigit:
 248  * @c: any character
 249  *
 250  * Determines whether a character is a hexadecimal-digit character.
 251  *
 252  * Unlike the standard C library isxdigit() function, this takes
 253  * a char, not an int, so don't call it on %EOF, but no need to
 254  * cast to #guchar before passing a possibly non-ASCII character in.
 255  *
 256  * Returns: %TRUE if @c is an ASCII hexadecimal-digit character.
 257  */
 258
 259 /**
 260  * G_ASCII_DTOSTR_BUF_SIZE:
 261  *
 262  * A good size for a buffer to be passed into g_ascii_dtostr().
 263  * It is guaranteed to be enough for all output of that function
 264  * on systems with 64bit IEEE-compatible doubles.
 265  *
 266  * The typical usage would be something like:
 267  * |[<!-- language="C" -->
 268  *   char buf[G_ASCII_DTOSTR_BUF_SIZE];
 269  *
 270  *   fprintf (out, "value=%s\n", g_ascii_dtostr (buf, sizeof (buf), value));
 271  * ]|
 272  */
 273
 274 /**
 275  * g_strstrip:
 276  * @string: a string to remove the leading and trailing whitespace from
 277  *
 278  * Removes leading and trailing whitespace from a string.
 279  * See g_strchomp() and g_strchug().
 280  *
 281  * Returns: @string
 282  */
 283
 284 /**
 285  * G_STR_DELIMITERS:
 286  *
 287  * The standard delimiters, used in g_strdelimit().
 288  */
 289
 290 static const guint16 ascii_table_data[256] = {
 291   0x004, 0x004, 0x004, 0x004, 0x004, 0x004, 0x004, 0x004,
 292   0x004, 0x104, 0x104, 0x004, 0x104, 0x104, 0x004, 0x004,
 293   0x004, 0x004, 0x004, 0x004, 0x004, 0x004, 0x004, 0x004,
 294   0x004, 0x004, 0x004, 0x004, 0x004, 0x004, 0x004, 0x004,
 295   0x140, 0x0d0, 0x0d0, 0x0d0, 0x0d0, 0x0d0, 0x0d0, 0x0d0,
 296   0x0d0, 0x0d0, 0x0d0, 0x0d0, 0x0d0, 0x0d0, 0x0d0, 0x0d0,
 297   0x459, 0x459, 0x459, 0x459, 0x459, 0x459, 0x459, 0x459,
 298   0x459, 0x459, 0x0d0, 0x0d0, 0x0d0, 0x0d0, 0x0d0, 0x0d0,
 299   0x0d0, 0x653, 0x653, 0x653, 0x653, 0x653, 0x653, 0x253,
 300   0x253, 0x253, 0x253, 0x253, 0x253, 0x253, 0x253, 0x253,
 301   0x253, 0x253, 0x253, 0x253, 0x253, 0x253, 0x253, 0x253,
 302   0x253, 0x253, 0x253, 0x0d0, 0x0d0, 0x0d0, 0x0d0, 0x0d0,
 303   0x0d0, 0x473, 0x473, 0x473, 0x473, 0x473, 0x473, 0x073,
 304   0x073, 0x073, 0x073, 0x073, 0x073, 0x073, 0x073, 0x073,
 305   0x073, 0x073, 0x073, 0x073, 0x073, 0x073, 0x073, 0x073,
 306   0x073, 0x073, 0x073, 0x0d0, 0x0d0, 0x0d0, 0x0d0, 0x004
 307   /* the upper 128 are all zeroes */
 308 };
 309
 310 const guint16 * const g_ascii_table = ascii_table_data;
 311
 312 #if defined (HAVE_NEWLOCALE) && \
 313     defined (HAVE_USELOCALE) && \
 314     defined (HAVE_STRTOD_L) && \
 315     defined (HAVE_STRTOULL_L) && \
 316     defined (HAVE_STRTOLL_L)
 317 #define USE_XLOCALE 1
 318 #endif
 319
 320 #ifdef USE_XLOCALE
 321 static locale_t
 322 get_C_locale (void)
 323 {
 324   static gsize initialized = FALSE;
 325   static locale_t C_locale = NULL;
 326
 327   if (g_once_init_enter (&initialized))
 328     {
 329       C_locale = newlocale (LC_ALL_MASK, "C", NULL);
 330       g_once_init_leave (&initialized, TRUE);
 331     }
 332
 333   return C_locale;
 334 }
 335 #endif
 336
 337 /**
 338  * g_strdup:
 339  * @str: the string to duplicate
 340  *
 341  * Duplicates a string. If @str is %NULL it returns %NULL.
 342  * The returned string should be freed with g_free()
 343  * when no longer needed.
 344  *
 345  * Returns: a newly-allocated copy of @str
 346  */
 347 gchar*
 348 g_strdup (const gchar *str)
 349 {
 350   gchar *new_str;
 351   gsize length;
 352
 353   if (str)
 354     {
 355       length = strlen (str) + 1;
 356       new_str = g_new (char, length);
 357       memcpy (new_str, str, length);
 358     }
 359   else
 360     new_str = NULL;
 361
 362   return new_str;
 363 }
 364
 365 /**
 366  * g_memdup:
 367  * @mem: the memory to copy.
 368  * @byte_size: the number of bytes to copy.
 369  *
 370  * Allocates @byte_size bytes of memory, and copies @byte_size bytes into it
 371  * from @mem. If @mem is %NULL it returns %NULL.
 372  *
 373  * Returns: a pointer to the newly-allocated copy of the memory, or %NULL if @mem
 374  *  is %NULL.
 375  */
 376 gpointer
 377 g_memdup (gconstpointer mem,
 378           guint         byte_size)
 379 {
 380   gpointer new_mem;
 381
 382   if (mem)
 383     {
 384       new_mem = g_malloc (byte_size);
 385       memcpy (new_mem, mem, byte_size);
 386     }
 387   else
 388     new_mem = NULL;
 389
 390   return new_mem;
 391 }
 392
 393 /**
 394  * g_strndup:
 395  * @str: the string to duplicate
 396  * @n: the maximum number of bytes to copy from @str
 397  *
 398  * Duplicates the first @n bytes of a string, returning a newly-allocated
 399  * buffer @n + 1 bytes long which will always be nul-terminated. If @str
 400  * is less than @n bytes long the buffer is padded with nuls. If @str is
 401  * %NULL it returns %NULL. The returned value should be freed when no longer
 402  * needed.
 403  *
 404  * To copy a number of characters from a UTF-8 encoded string,
 405  * use g_utf8_strncpy() instead.
 406  *
 407  * Returns: a newly-allocated buffer containing the first @n bytes
 408  *     of @str, nul-terminated
 409  */
 410 gchar*
 411 g_strndup (const gchar *str,
 412            gsize        n)
 413 {
 414   gchar *new_str;
 415
 416   if (str)
 417     {
 418       new_str = g_new (gchar, n + 1);
 419       strncpy (new_str, str, n);
 420       new_str[n] = '\0';
 421     }
 422   else
 423     new_str = NULL;
 424
 425   return new_str;
 426 }
 427
 428 /**
 429  * g_strnfill:
 430  * @length: the length of the new string
 431  * @fill_char: the byte to fill the string with
 432  *
 433  * Creates a new string @length bytes long filled with @fill_char.
 434  * The returned string should be freed when no longer needed.
 435  *
 436  * Returns: a newly-allocated string filled the @fill_char
 437  */
 438 gchar*
 439 g_strnfill (gsize length,
 440             gchar fill_char)
 441 {
 442   gchar *str;
 443
 444   str = g_new (gchar, length + 1);
 445   memset (str, (guchar)fill_char, length);
 446   str[length] = '\0';
 447
 448   return str;
 449 }
 450
 451 /**
 452  * g_stpcpy:
 453  * @dest: destination buffer.
 454  * @src: source string.
 455  *
 456  * Copies a nul-terminated string into the dest buffer, include the
 457  * trailing nul, and return a pointer to the trailing nul byte.
 458  * This is useful for concatenating multiple strings together
 459  * without having to repeatedly scan for the end.
 460  *
 461  * Returns: a pointer to trailing nul byte.
 462  **/
 463 gchar *
 464 g_stpcpy (gchar       *dest,
 465           const gchar *src)
 466 {
 467 #ifdef HAVE_STPCPY
 468   g_return_val_if_fail (dest != NULL, NULL);
 469   g_return_val_if_fail (src != NULL, NULL);
 470   return stpcpy (dest, src);
 471 #else
 472   gchar *d = dest;
 473   const gchar *s = src;
 474
 475   g_return_val_if_fail (dest != NULL, NULL);
 476   g_return_val_if_fail (src != NULL, NULL);
 477   do
 478     *d++ = *s;
 479   while (*s++ != '\0');
 480
 481   return d - 1;
 482 #endif
 483 }
 484
 485 /**
 486  * g_strdup_vprintf:
 487  * @format: a standard printf() format string, but notice
 488  *     [string precision pitfalls][string-precision]
 489  * @args: the list of parameters to insert into the format string
 490  *
 491  * Similar to the standard C vsprintf() function but safer, since it
 492  * calculates the maximum space required and allocates memory to hold
 493  * the result. The returned string should be freed with g_free() when
 494  * no longer needed.
 495  *
 496  * See also g_vasprintf(), which offers the same functionality, but
 497  * additionally returns the length of the allocated string.
 498  *
 499  * Returns: a newly-allocated string holding the result
 500  */
 501 gchar*
 502 g_strdup_vprintf (const gchar *format,
 503                   va_list      args)
 504 {
 505   gchar *string = NULL;
 506
 507   g_vasprintf (&string, format, args);
 508
 509   return string;
 510 }
 511
 512 /**
 513  * g_strdup_printf:
 514  * @format: a standard printf() format string, but notice
 515  *     [string precision pitfalls][string-precision]
 516  * @...: the parameters to insert into the format string
 517  *
 518  * Similar to the standard C sprintf() function but safer, since it
 519  * calculates the maximum space required and allocates memory to hold
 520  * the result. The returned string should be freed with g_free() when no
 521  * longer needed.
 522  *
 523  * Returns: a newly-allocated string holding the result
 524  */
 525 gchar*
 526 g_strdup_printf (const gchar *format,
 527                  ...)
 528 {
 529   gchar *buffer;
 530   va_list args;
 531
 532   va_start (args, format);
 533   buffer = g_strdup_vprintf (format, args);
 534   va_end (args);
 535
 536   return buffer;
 537 }
 538
 539 /**
 540  * g_strconcat:
 541  * @string1: the first string to add, which must not be %NULL
 542  * @...: a %NULL-terminated list of strings to append to the string
 543  *
 544  * Concatenates all of the given strings into one long string. The
 545  * returned string should be freed with g_free() when no longer needed.
 546  *
 547  * The variable argument list must end with %NULL. If you forget the %NULL,
 548  * g_strconcat() will start appending random memory junk to your string.
 549  *
 550  * Note that this function is usually not the right function to use to
 551  * assemble a translated message from pieces, since proper translation
 552  * often requires the pieces to be reordered.
 553  *
 554  * Returns: a newly-allocated string containing all the string arguments
 555  */
 556 gchar*
 557 g_strconcat (const gchar *string1, ...)
 558 {
 559   gsize   l;
 560   va_list args;
 561   gchar   *s;
 562   gchar   *concat;
 563   gchar   *ptr;
 564
 565   if (!string1)
 566     return NULL;
 567
 568   l = 1 + strlen (string1);
 569   va_start (args, string1);
 570   s = va_arg (args, gchar*);
 571   while (s)
 572     {
 573       l += strlen (s);
 574       s = va_arg (args, gchar*);
 575     }
 576   va_end (args);
 577
 578   concat = g_new (gchar, l);
 579   ptr = concat;
 580
 581   ptr = g_stpcpy (ptr, string1);
 582   va_start (args, string1);
 583   s = va_arg (args, gchar*);
 584   while (s)
 585     {
 586       ptr = g_stpcpy (ptr, s);
 587       s = va_arg (args, gchar*);
 588     }
 589   va_end (args);
 590
 591   return concat;
 592 }
 593
 594 /**
 595  * g_strtod:
 596  * @nptr:    the string to convert to a numeric value.
 597  * @endptr:  if non-%NULL, it returns the character after
 598  *           the last character used in the conversion.
 599  *
 600  * Converts a string to a #gdouble value.
 601  * It calls the standard strtod() function to handle the conversion, but
 602  * if the string is not completely converted it attempts the conversion
 603  * again with g_ascii_strtod(), and returns the best match.
 604  *
 605  * This function should seldom be used. The normal situation when reading
 606  * numbers not for human consumption is to use g_ascii_strtod(). Only when
 607  * you know that you must expect both locale formatted and C formatted numbers
 608  * should you use this. Make sure that you don't pass strings such as comma
 609  * separated lists of values, since the commas may be interpreted as a decimal
 610  * point in some locales, causing unexpected results.
 611  *
 612  * Returns: the #gdouble value.
 613  **/
 614 gdouble
 615 g_strtod (const gchar *nptr,
 616           gchar      **endptr)
 617 {
 618   gchar *fail_pos_1;
 619   gchar *fail_pos_2;
 620   gdouble val_1;
 621   gdouble val_2 = 0;
 622
 623   g_return_val_if_fail (nptr != NULL, 0);
 624
 625   fail_pos_1 = NULL;
 626   fail_pos_2 = NULL;
 627
 628   val_1 = strtod (nptr, &fail_pos_1);
 629
 630   if (fail_pos_1 && fail_pos_1[0] != 0)
 631     val_2 = g_ascii_strtod (nptr, &fail_pos_2);
 632
 633   if (!fail_pos_1 || fail_pos_1[0] == 0 || fail_pos_1 >= fail_pos_2)
 634     {
 635       if (endptr)
 636         *endptr = fail_pos_1;
 637       return val_1;
 638     }
 639   else
 640     {
 641       if (endptr)
 642         *endptr = fail_pos_2;
 643       return val_2;
 644     }
 645 }
 646
 647 /**
 648  * g_ascii_strtod:
 649  * @nptr:    the string to convert to a numeric value.
 650  * @endptr:  if non-%NULL, it returns the character after
 651  *           the last character used in the conversion.
 652  *
 653  * Converts a string to a #gdouble value.
 654  *
 655  * This function behaves like the standard strtod() function
 656  * does in the C locale. It does this without actually changing
 657  * the current locale, since that would not be thread-safe.
 658  * A limitation of the implementation is that this function
 659  * will still accept localized versions of infinities and NANs.
 660  *
 661  * This function is typically used when reading configuration
 662  * files or other non-user input that should be locale independent.
 663  * To handle input from the user you should normally use the
 664  * locale-sensitive system strtod() function.
 665  *
 666  * To convert from a #gdouble to a string in a locale-insensitive
 667  * way, use g_ascii_dtostr().
 668  *
 669  * If the correct value would cause overflow, plus or minus %HUGE_VAL
 670  * is returned (according to the sign of the value), and %ERANGE is
 671  * stored in %errno. If the correct value would cause underflow,
 672  * zero is returned and %ERANGE is stored in %errno.
 673  *
 674  * This function resets %errno before calling strtod() so that
 675  * you can reliably detect overflow and underflow.
 676  *
 677  * Returns: the #gdouble value.
 678  */
 679 gdouble
 680 g_ascii_strtod (const gchar *nptr,
 681                 gchar      **endptr)
 682 {
 683 #ifdef USE_XLOCALE
 684
 685   g_return_val_if_fail (nptr != NULL, 0);
 686
 687   errno = 0;
 688
 689   return strtod_l (nptr, endptr, get_C_locale ());
 690
 691 #else
 692
 693   gchar *fail_pos;
 694   gdouble val;
 695 #ifndef __BIONIC__
 696   struct lconv *locale_data;
 697 #endif
 698   const char *decimal_point;
 699   int decimal_point_len;
 700   const char *p, *decimal_point_pos;
 701   const char *end = NULL; /* Silence gcc */
 702   int strtod_errno;
 703
 704   g_return_val_if_fail (nptr != NULL, 0);
 705
 706   fail_pos = NULL;
 707
 708 #ifndef __BIONIC__
 709   locale_data = localeconv ();
 710   decimal_point = locale_data->decimal_point;
 711   decimal_point_len = strlen (decimal_point);
 712 #else
 713   decimal_point = ".";
 714   decimal_point_len = 1;
 715 #endif
 716
 717   g_assert (decimal_point_len != 0);
 718
 719   decimal_point_pos = NULL;
 720   end = NULL;
 721
 722   if (decimal_point[0] != '.' ||
 723       decimal_point[1] != 0)
 724     {
 725       p = nptr;
 726       /* Skip leading space */
 727       while (g_ascii_isspace (*p))
 728         p++;
 729
 730       /* Skip leading optional sign */
 731       if (*p == '+' || *p == '-')
 732         p++;
 733
 734       if (p[0] == '0' &&
 735           (p[1] == 'x' || p[1] == 'X'))
 736         {
 737           p += 2;
 738           /* HEX - find the (optional) decimal point */
 739
 740           while (g_ascii_isxdigit (*p))
 741             p++;
 742
 743           if (*p == '.')
 744             decimal_point_pos = p++;
 745
 746           while (g_ascii_isxdigit (*p))
 747             p++;
 748
 749           if (*p == 'p' || *p == 'P')
 750             p++;
 751           if (*p == '+' || *p == '-')
 752             p++;
 753           while (g_ascii_isdigit (*p))
 754             p++;
 755
 756           end = p;
 757         }
 758       else if (g_ascii_isdigit (*p) || *p == '.')
 759         {
 760           while (g_ascii_isdigit (*p))
 761             p++;
 762
 763           if (*p == '.')
 764             decimal_point_pos = p++;
 765
 766           while (g_ascii_isdigit (*p))
 767             p++;
 768
 769           if (*p == 'e' || *p == 'E')
 770             p++;
 771           if (*p == '+' || *p == '-')
 772             p++;
 773           while (g_ascii_isdigit (*p))
 774             p++;
 775
 776           end = p;
 777         }
 778       /* For the other cases, we need not convert the decimal point */
 779     }
 780
 781   if (decimal_point_pos)
 782     {
 783       char *copy, *c;
 784
 785       /* We need to convert the '.' to the locale specific decimal point */
 786       copy = g_malloc (end - nptr + 1 + decimal_point_len);
 787
 788       c = copy;
 789       memcpy (c, nptr, decimal_point_pos - nptr);
 790       c += decimal_point_pos - nptr;
 791       memcpy (c, decimal_point, decimal_point_len);
 792       c += decimal_point_len;
 793       memcpy (c, decimal_point_pos + 1, end - (decimal_point_pos + 1));
 794       c += end - (decimal_point_pos + 1);
 795       *c = 0;
 796
 797       errno = 0;
 798       val = strtod (copy, &fail_pos);
 799       strtod_errno = errno;
 800
 801       if (fail_pos)
 802         {
 803           if (fail_pos - copy > decimal_point_pos - nptr)
 804             fail_pos = (char *)nptr + (fail_pos - copy) - (decimal_point_len - 1);
 805           else
 806             fail_pos = (char *)nptr + (fail_pos - copy);
 807         }
 808
 809       g_free (copy);
 810
 811     }
 812   else if (end)
 813     {
 814       char *copy;
 815
 816       copy = g_malloc (end - (char *)nptr + 1);
 817       memcpy (copy, nptr, end - nptr);
 818       *(copy + (end - (char *)nptr)) = 0;
 819
 820       errno = 0;
 821       val = strtod (copy, &fail_pos);
 822       strtod_errno = errno;
 823
 824       if (fail_pos)
 825         {
 826           fail_pos = (char *)nptr + (fail_pos - copy);
 827         }
 828
 829       g_free (copy);
 830     }
 831   else
 832     {
 833       errno = 0;
 834       val = strtod (nptr, &fail_pos);
 835       strtod_errno = errno;
 836     }
 837
 838   if (endptr)
 839     *endptr = fail_pos;
 840
 841   errno = strtod_errno;
 842
 843   return val;
 844 #endif
 845 }
 846
 847
 848 /**
 849  * g_ascii_dtostr:
 850  * @buffer: A buffer to place the resulting string in
 851  * @buf_len: The length of the buffer.
 852  * @d: The #gdouble to convert
 853  *
 854  * Converts a #gdouble to a string, using the '.' as
 855  * decimal point.
 856  *
 857  * This function generates enough precision that converting
 858  * the string back using g_ascii_strtod() gives the same machine-number
 859  * (on machines with IEEE compatible 64bit doubles). It is
 860  * guaranteed that the size of the resulting string will never
 861  * be larger than @G_ASCII_DTOSTR_BUF_SIZE bytes, including the terminating
 862  * nul character, which is always added.
 863  *
 864  * Returns: The pointer to the buffer with the converted string.
 865  **/
 866 gchar *
 867 g_ascii_dtostr (gchar       *buffer,
 868                 gint         buf_len,
 869                 gdouble      d)
 870 {
 871   return g_ascii_formatd (buffer, buf_len, "%.17g", d);
 872 }
 873
 874 #pragma GCC diagnostic push
 875 #pragma GCC diagnostic ignored "-Wformat-nonliteral"
 876
 877 /**
 878  * g_ascii_formatd:
 879  * @buffer: A buffer to place the resulting string in
 880  * @buf_len: The length of the buffer.
 881  * @format: The printf()-style format to use for the
 882  *          code to use for converting.
 883  * @d: The #gdouble to convert
 884  *
 885  * Converts a #gdouble to a string, using the '.' as
 886  * decimal point. To format the number you pass in
 887  * a printf()-style format string. Allowed conversion
 888  * specifiers are 'e', 'E', 'f', 'F', 'g' and 'G'.
 889  *
 890  * The returned buffer is guaranteed to be nul-terminated.
 891  *
 892  * If you just want to want to serialize the value into a
 893  * string, use g_ascii_dtostr().
 894  *
 895  * Returns: The pointer to the buffer with the converted string.
 896  */
 897 gchar *
 898 g_ascii_formatd (gchar       *buffer,
 899                  gint         buf_len,
 900                  const gchar *format,
 901                  gdouble      d)
 902 {
 903 #ifdef USE_XLOCALE
 904   locale_t old_locale;
 905
 906   old_locale = uselocale (get_C_locale ());
 907    _g_snprintf (buffer, buf_len, format, d);
 908   uselocale (old_locale);
 909
 910   return buffer;
 911 #else
 912 #ifndef __BIONIC__
 913   struct lconv *locale_data;
 914 #endif
 915   const char *decimal_point;
 916   int decimal_point_len;
 917   gchar *p;
 918   int rest_len;
 919   gchar format_char;
 920
 921   g_return_val_if_fail (buffer != NULL, NULL);
 922   g_return_val_if_fail (format[0] == '%', NULL);
 923   g_return_val_if_fail (strpbrk (format + 1, "'l%") == NULL, NULL);
 924
 925   format_char = format[strlen (format) - 1];
 926
 927   g_return_val_if_fail (format_char == 'e' || format_char == 'E' ||
 928                         format_char == 'f' || format_char == 'F' ||
 929                         format_char == 'g' || format_char == 'G',
 930                         NULL);
 931
 932   if (format[0] != '%')
 933     return NULL;
 934
 935   if (strpbrk (format + 1, "'l%"))
 936     return NULL;
 937
 938   if (!(format_char == 'e' || format_char == 'E' ||
 939         format_char == 'f' || format_char == 'F' ||
 940         format_char == 'g' || format_char == 'G'))
 941     return NULL;
 942
 943   _g_snprintf (buffer, buf_len, format, d);
 944
 945 #ifndef __BIONIC__
 946   locale_data = localeconv ();
 947   decimal_point = locale_data->decimal_point;
 948   decimal_point_len = strlen (decimal_point);
 949 #else
 950   decimal_point = ".";
 951   decimal_point_len = 1;
 952 #endif
 953
 954   g_assert (decimal_point_len != 0);
 955
 956   if (decimal_point[0] != '.' ||
 957       decimal_point[1] != 0)
 958     {
 959       p = buffer;
 960
 961       while (g_ascii_isspace (*p))
 962         p++;
 963
 964       if (*p == '+' || *p == '-')
 965         p++;
 966
 967       while (isdigit ((guchar)*p))
 968         p++;
 969
 970       if (strncmp (p, decimal_point, decimal_point_len) == 0)
 971         {
 972           *p = '.';
 973           p++;
 974           if (decimal_point_len > 1)
 975             {
 976               rest_len = strlen (p + (decimal_point_len-1));
 977               memmove (p, p + (decimal_point_len-1), rest_len);
 978               p[rest_len] = 0;
 979             }
 980         }
 981     }
 982
 983   return buffer;
 984 #endif
 985 }
 986 #pragma GCC diagnostic pop
 987
 988 #define ISSPACE(c)              ((c) == ' ' || (c) == '\f' || (c) == '\n' || \
 989                                  (c) == '\r' || (c) == '\t' || (c) == '\v')
 990 #define ISUPPER(c)              ((c) >= 'A' && (c) <= 'Z')
 991 #define ISLOWER(c)              ((c) >= 'a' && (c) <= 'z')
 992 #define ISALPHA(c)              (ISUPPER (c) || ISLOWER (c))
 993 #define TOUPPER(c)              (ISLOWER (c) ? (c) - 'a' + 'A' : (c))
 994 #define TOLOWER(c)              (ISUPPER (c) ? (c) - 'A' + 'a' : (c))
 995
 996 #ifndef USE_XLOCALE
 997
 998 static guint64
 999 g_parse_long_long (const gchar  *nptr,
1000                    const gchar **endptr,
1001                    guint         base,
1002                    gboolean     *negative)
1003 {
1004   /* this code is based on on the strtol(3) code from GNU libc released under
1005    * the GNU Lesser General Public License.
1006    *
1007    * Copyright (C) 1991,92,94,95,96,97,98,99,2000,01,02
1008    *        Free Software Foundation, Inc.
1009    */
1010   gboolean overflow;
1011   guint64 cutoff;
1012   guint64 cutlim;
1013   guint64 ui64;
1014   const gchar *s, *save;
1015   guchar c;
1016
1017   g_return_val_if_fail (nptr != NULL, 0);
1018
1019   *negative = FALSE;
1020   if (base == 1 || base > 36)
1021     {
1022       errno = EINVAL;
1023       if (endptr)
1024         *endptr = nptr;
1025       return 0;
1026     }
1027
1028   save = s = nptr;
1029
1030   /* Skip white space.  */
1031   while (ISSPACE (*s))
1032     ++s;
1033
1034   if (G_UNLIKELY (!*s))
1035     goto noconv;
1036
1037   /* Check for a sign.  */
1038   if (*s == '-')
1039     {
1040       *negative = TRUE;
1041       ++s;
1042     }
1043   else if (*s == '+')
1044     ++s;
1045
1046   /* Recognize number prefix and if BASE is zero, figure it out ourselves.  */
1047   if (*s == '0')
1048     {
1049       if ((base == 0 || base == 16) && TOUPPER (s[1]) == 'X')
1050         {
1051           s += 2;
1052           base = 16;
1053         }
1054       else if (base == 0)
1055         base = 8;
1056     }
1057   else if (base == 0)
1058     base = 10;
1059
1060   /* Save the pointer so we can check later if anything happened.  */
1061   save = s;
1062   cutoff = G_MAXUINT64 / base;
1063   cutlim = G_MAXUINT64 % base;
1064
1065   overflow = FALSE;
1066   ui64 = 0;
1067   c = *s;
1068   for (; c; c = *++s)
1069     {
1070       if (c >= '0' && c <= '9')
1071         c -= '0';
1072       else if (ISALPHA (c))
1073         c = TOUPPER (c) - 'A' + 10;
1074       else
1075         break;
1076       if (c >= base)
1077         break;
1078       /* Check for overflow.  */
1079       if (ui64 > cutoff || (ui64 == cutoff && c > cutlim))
1080         overflow = TRUE;
1081       else
1082         {
1083           ui64 *= base;
1084           ui64 += c;
1085         }
1086     }
1087
1088   /* Check if anything actually happened.  */
1089   if (s == save)
1090     goto noconv;
1091
1092   /* Store in ENDPTR the address of one character
1093      past the last character we converted.  */
1094   if (endptr)
1095     *endptr = s;
1096
1097   if (G_UNLIKELY (overflow))
1098     {
1099       errno = ERANGE;
1100       return G_MAXUINT64;
1101     }
1102
1103   return ui64;
1104
1105  noconv:
1106   /* We must handle a special case here: the base is 0 or 16 and the
1107      first two characters are '0' and 'x', but the rest are no
1108      hexadecimal digits.  This is no error case.  We return 0 and
1109      ENDPTR points to the `x`.  */
1110   if (endptr)
1111     {
1112       if (save - nptr >= 2 && TOUPPER (save[-1]) == 'X'
1113           && save[-2] == '0')
1114         *endptr = &save[-1];
1115       else
1116         /*  There was no number to convert.  */
1117         *endptr = nptr;
1118     }
1119   return 0;
1120 }
1121 #endif /* !USE_XLOCALE */
1122
1123 /**
1124  * g_ascii_strtoull:
1125  * @nptr:    the string to convert to a numeric value.
1126  * @endptr:  if non-%NULL, it returns the character after
1127  *           the last character used in the conversion.
1128  * @base:    to be used for the conversion, 2..36 or 0
1129  *
1130  * Converts a string to a #guint64 value.
1131  * This function behaves like the standard strtoull() function
1132  * does in the C locale. It does this without actually
1133  * changing the current locale, since that would not be
1134  * thread-safe.
1135  *
1136  * This function is typically used when reading configuration
1137  * files or other non-user input that should be locale independent.
1138  * To handle input from the user you should normally use the
1139  * locale-sensitive system strtoull() function.
1140  *
1141  * If the correct value would cause overflow, %G_MAXUINT64
1142  * is returned, and `ERANGE` is stored in `errno`.
1143  * If the base is outside the valid range, zero is returned, and
1144  * `EINVAL` is stored in `errno`.
1145  * If the string conversion fails, zero is returned, and @endptr returns
1146  * @nptr (if @endptr is non-%NULL).
1147  *
1148  * Returns: the #guint64 value or zero on error.
1149  *
1150  * Since: 2.2
1151  */
1152 guint64
1153 g_ascii_strtoull (const gchar *nptr,
1154                   gchar      **endptr,
1155                   guint        base)
1156 {
1157 #ifdef USE_XLOCALE
1158   return strtoull_l (nptr, endptr, base, get_C_locale ());
1159 #else
1160   gboolean negative;
1161   guint64 result;
1162
1163   result = g_parse_long_long (nptr, (const gchar **) endptr, base, &negative);
1164
1165   /* Return the result of the appropriate sign.  */
1166   return negative ? -result : result;
1167 #endif
1168 }
1169
1170 /**
1171  * g_ascii_strtoll:
1172  * @nptr:    the string to convert to a numeric value.
1173  * @endptr:  if non-%NULL, it returns the character after
1174  *           the last character used in the conversion.
1175  * @base:    to be used for the conversion, 2..36 or 0
1176  *
1177  * Converts a string to a #gint64 value.
1178  * This function behaves like the standard strtoll() function
1179  * does in the C locale. It does this without actually
1180  * changing the current locale, since that would not be
1181  * thread-safe.
1182  *
1183  * This function is typically used when reading configuration
1184  * files or other non-user input that should be locale independent.
1185  * To handle input from the user you should normally use the
1186  * locale-sensitive system strtoll() function.
1187  *
1188  * If the correct value would cause overflow, %G_MAXINT64 or %G_MININT64
1189  * is returned, and `ERANGE` is stored in `errno`.
1190  * If the base is outside the valid range, zero is returned, and
1191  * `EINVAL` is stored in `errno`. If the
1192  * string conversion fails, zero is returned, and @endptr returns @nptr
1193  * (if @endptr is non-%NULL).
1194  *
1195  * Returns: the #gint64 value or zero on error.
1196  *
1197  * Since: 2.12
1198  */
1199 gint64
1200 g_ascii_strtoll (const gchar *nptr,
1201                  gchar      **endptr,
1202                  guint        base)
1203 {
1204 #ifdef USE_XLOCALE
1205   return strtoll_l (nptr, endptr, base, get_C_locale ());
1206 #else
1207   gboolean negative;
1208   guint64 result;
1209
1210   result = g_parse_long_long (nptr, (const gchar **) endptr, base, &negative);
1211
1212   if (negative && result > (guint64) G_MININT64)
1213     {
1214       errno = ERANGE;
1215       return G_MININT64;
1216     }
1217   else if (!negative && result > (guint64) G_MAXINT64)
1218     {
1219       errno = ERANGE;
1220       return G_MAXINT64;
1221     }
1222   else if (negative)
1223     return - (gint64) result;
1224   else
1225     return (gint64) result;
1226 #endif
1227 }
1228
1229 /**
1230  * g_strerror:
1231  * @errnum: the system error number. See the standard C %errno
1232  *     documentation
1233  *
1234  * Returns a string corresponding to the given error code, e.g.
1235  * "no such process". You should use this function in preference to
1236  * strerror(), because it returns a string in UTF-8 encoding, and since
1237  * not all platforms support the strerror() function.
1238  *
1239  * Returns: a UTF-8 string describing the error code. If the error code
1240  *     is unknown, it returns "unknown error (<code>)".
1241  */
1242 const gchar *
1243 g_strerror (gint errnum)
1244 {
1245   gchar *msg;
1246   gchar *tofree = NULL;
1247   const gchar *ret;
1248   gint saved_errno = errno;
1249
1250   msg = strerror (errnum);
1251   if (!g_get_charset (NULL))
1252     msg = tofree = g_locale_to_utf8 (msg, -1, NULL, NULL, NULL);
1253
1254   ret = g_intern_string (msg);
1255   g_free (tofree);
1256   errno = saved_errno;
1257   return ret;
1258 }
1259
1260 /**
1261  * g_strsignal:
1262  * @signum: the signal number. See the `signal` documentation
1263  *
1264  * Returns a string describing the given signal, e.g. "Segmentation fault".
1265  * You should use this function in preference to strsignal(), because it
1266  * returns a string in UTF-8 encoding, and since not all platforms support
1267  * the strsignal() function.
1268  *
1269  * Returns: a UTF-8 string describing the signal. If the signal is unknown,
1270  *     it returns "unknown signal (<signum>)".
1271  */
1272 const gchar *
1273 g_strsignal (gint signum)
1274 {
1275   gchar *msg;
1276   gchar *tofree;
1277   const gchar *ret;
1278
1279   msg = tofree = NULL;
1280
1281 #ifdef HAVE_STRSIGNAL
1282   msg = strsignal (signum);
1283   if (!g_get_charset (NULL))
1284     msg = tofree = g_locale_to_utf8 (msg, -1, NULL, NULL, NULL);
1285 #endif
1286
1287   if (!msg)
1288     msg = tofree = g_strdup_printf ("unknown signal (%d)", signum);
1289   ret = g_intern_string (msg);
1290   g_free (tofree);
1291
1292   return ret;
1293 }
1294
1295 /* Functions g_strlcpy and g_strlcat were originally developed by
1296  * Todd C. Miller <Todd.Miller@courtesan.com> to simplify writing secure code.
1297  * See http://www.openbsd.org/cgi-bin/man.cgi?query=strlcpy
1298  * for more information.
1299  */
1300
1301 #ifdef HAVE_STRLCPY
1302 /* Use the native ones, if available; they might be implemented in assembly */
1303 gsize
1304 g_strlcpy (gchar       *dest,
1305            const gchar *src,
1306            gsize        dest_size)
1307 {
1308   g_return_val_if_fail (dest != NULL, 0);
1309   g_return_val_if_fail (src  != NULL, 0);
1310
1311   return strlcpy (dest, src, dest_size);
1312 }
1313
1314 gsize
1315 g_strlcat (gchar       *dest,
1316            const gchar *src,
1317            gsize        dest_size)
1318 {
1319   g_return_val_if_fail (dest != NULL, 0);
1320   g_return_val_if_fail (src  != NULL, 0);
1321
1322   return strlcat (dest, src, dest_size);
1323 }
1324
1325 #else /* ! HAVE_STRLCPY */
1326 /**
1327  * g_strlcpy:
1328  * @dest: destination buffer
1329  * @src: source buffer
1330  * @dest_size: length of @dest in bytes
1331  *
1332  * Portability wrapper that calls strlcpy() on systems which have it,
1333  * and emulates strlcpy() otherwise. Copies @src to @dest; @dest is
1334  * guaranteed to be nul-terminated; @src must be nul-terminated;
1335  * @dest_size is the buffer size, not the number of bytes to copy.
1336  *
1337  * At most @dest_size - 1 characters will be copied. Always nul-terminates
1338  * (unless @dest_size is 0). This function does not allocate memory. Unlike
1339  * strncpy(), this function doesn't pad @dest (so it's often faster). It
1340  * returns the size of the attempted result, strlen (src), so if
1341  * @retval >= @dest_size, truncation occurred.
1342  *
1343  * Caveat: strlcpy() is supposedly more secure than strcpy() or strncpy(),
1344  * but if you really want to avoid screwups, g_strdup() is an even better
1345  * idea.
1346  *
1347  * Returns: length of @src
1348  */
1349 gsize
1350 g_strlcpy (gchar       *dest,
1351            const gchar *src,
1352            gsize        dest_size)
1353 {
1354   gchar *d = dest;
1355   const gchar *s = src;
1356   gsize n = dest_size;
1357
1358   g_return_val_if_fail (dest != NULL, 0);
1359   g_return_val_if_fail (src  != NULL, 0);
1360
1361   /* Copy as many bytes as will fit */
1362   if (n != 0 && --n != 0)
1363     do
1364       {
1365         gchar c = *s++;
1366
1367         *d++ = c;
1368         if (c == 0)
1369           break;
1370       }
1371     while (--n != 0);
1372
1373   /* If not enough room in dest, add NUL and traverse rest of src */
1374   if (n == 0)
1375     {
1376       if (dest_size != 0)
1377         *d = 0;
1378       while (*s++)
1379         ;
1380     }
1381
1382   return s - src - 1;  /* count does not include NUL */
1383 }
1384
1385 /**
1386  * g_strlcat:
1387  * @dest: destination buffer, already containing one nul-terminated string
1388  * @src: source buffer
1389  * @dest_size: length of @dest buffer in bytes (not length of existing string
1390  *     inside @dest)
1391  *
1392  * Portability wrapper that calls strlcat() on systems which have it,
1393  * and emulates it otherwise. Appends nul-terminated @src string to @dest,
1394  * guaranteeing nul-termination for @dest. The total size of @dest won't
1395  * exceed @dest_size.
1396  *
1397  * At most @dest_size - 1 characters will be copied. Unlike strncat(),
1398  * @dest_size is the full size of dest, not the space left over. This
1399  * function does not allocate memory. It always nul-terminates (unless
1400  * @dest_size == 0 or there were no nul characters in the @dest_size
1401  * characters of dest to start with).
1402  *
1403  * Caveat: this is supposedly a more secure alternative to strcat() or
1404  * strncat(), but for real security g_strconcat() is harder to mess up.
1405  *
1406  * Returns: size of attempted result, which is MIN (dest_size, strlen
1407  *     (original dest)) + strlen (src), so if retval >= dest_size,
1408  *     truncation occurred.
1409  */
1410 gsize
1411 g_strlcat (gchar       *dest,
1412            const gchar *src,
1413            gsize        dest_size)
1414 {
1415   gchar *d = dest;
1416   const gchar *s = src;
1417   gsize bytes_left = dest_size;
1418   gsize dlength;  /* Logically, MIN (strlen (d), dest_size) */
1419
1420   g_return_val_if_fail (dest != NULL, 0);
1421   g_return_val_if_fail (src  != NULL, 0);
1422
1423   /* Find the end of dst and adjust bytes left but don't go past end */
1424   while (*d != 0 && bytes_left-- != 0)
1425     d++;
1426   dlength = d - dest;
1427   bytes_left = dest_size - dlength;
1428
1429   if (bytes_left == 0)
1430     return dlength + strlen (s);
1431
1432   while (*s != 0)
1433     {
1434       if (bytes_left != 1)
1435         {
1436           *d++ = *s;
1437           bytes_left--;
1438         }
1439       s++;
1440     }
1441   *d = 0;
1442
1443   return dlength + (s - src);  /* count does not include NUL */
1444 }
1445 #endif /* ! HAVE_STRLCPY */
1446
1447 /**
1448  * g_ascii_strdown:
1449  * @str: a string
1450  * @len: length of @str in bytes, or -1 if @str is nul-terminated
1451  *
1452  * Converts all upper case ASCII letters to lower case ASCII letters.
1453  *
1454  * Returns: a newly-allocated string, with all the upper case
1455  *     characters in @str converted to lower case, with semantics that
1456  *     exactly match g_ascii_tolower(). (Note that this is unlike the
1457  *     old g_strdown(), which modified the string in place.)
1458  */
1459 gchar*
1460 g_ascii_strdown (const gchar *str,
1461                  gssize       len)
1462 {
1463   gchar *result, *s;
1464
1465   g_return_val_if_fail (str != NULL, NULL);
1466
1467   if (len < 0)
1468     len = strlen (str);
1469
1470   result = g_strndup (str, len);
1471   for (s = result; *s; s++)
1472     *s = g_ascii_tolower (*s);
1473
1474   return result;
1475 }
1476
1477 /**
1478  * g_ascii_strup:
1479  * @str: a string
1480  * @len: length of @str in bytes, or -1 if @str is nul-terminated
1481  *
1482  * Converts all lower case ASCII letters to upper case ASCII letters.
1483  *
1484  * Returns: a newly allocated string, with all the lower case
1485  *     characters in @str converted to upper case, with semantics that
1486  *     exactly match g_ascii_toupper(). (Note that this is unlike the
1487  *     old g_strup(), which modified the string in place.)
1488  */
1489 gchar*
1490 g_ascii_strup (const gchar *str,
1491                gssize       len)
1492 {
1493   gchar *result, *s;
1494
1495   g_return_val_if_fail (str != NULL, NULL);
1496
1497   if (len < 0)
1498     len = strlen (str);
1499
1500   result = g_strndup (str, len);
1501   for (s = result; *s; s++)
1502     *s = g_ascii_toupper (*s);
1503
1504   return result;
1505 }
1506
1507 /**
1508  * g_str_is_ascii:
1509  * @str: a string
1510  *
1511  * Determines if a string is pure ASCII. A string is pure ASCII if it
1512  * contains no bytes with the high bit set.
1513  *
1514  * Returns: %TRUE if @str is ASCII
1515  *
1516  * Since: 2.40
1517  */
1518 gboolean
1519 g_str_is_ascii (const gchar *str)
1520 {
1521   gint i;
1522
1523   for (i = 0; str[i]; i++)
1524     if (str[i] & 0x80)
1525       return FALSE;
1526
1527   return TRUE;
1528 }
1529
1530 /**
1531  * g_strdown:
1532  * @string: the string to convert.
1533  *
1534  * Converts a string to lower case.
1535  *
1536  * Returns: the string
1537  *
1538  * Deprecated:2.2: This function is totally broken for the reasons discussed
1539  * in the g_strncasecmp() docs - use g_ascii_strdown() or g_utf8_strdown()
1540  * instead.
1541  **/
1542 gchar*
1543 g_strdown (gchar *string)
1544 {
1545   guchar *s;
1546
1547   g_return_val_if_fail (string != NULL, NULL);
1548
1549   s = (guchar *) string;
1550
1551   while (*s)
1552     {
1553       if (isupper (*s))
1554         *s = tolower (*s);
1555       s++;
1556     }
1557
1558   return (gchar *) string;
1559 }
1560
1561 /**
1562  * g_strup:
1563  * @string: the string to convert
1564  *
1565  * Converts a string to upper case.
1566  *
1567  * Returns: the string
1568  *
1569  * Deprecated:2.2: This function is totally broken for the reasons
1570  *     discussed in the g_strncasecmp() docs - use g_ascii_strup()
1571  *     or g_utf8_strup() instead.
1572  */
1573 gchar*
1574 g_strup (gchar *string)
1575 {
1576   guchar *s;
1577
1578   g_return_val_if_fail (string != NULL, NULL);
1579
1580   s = (guchar *) string;
1581
1582   while (*s)
1583     {
1584       if (islower (*s))
1585         *s = toupper (*s);
1586       s++;
1587     }
1588
1589   return (gchar *) string;
1590 }
1591
1592 /**
1593  * g_strreverse:
1594  * @string: the string to reverse
1595  *
1596  * Reverses all of the bytes in a string. For example,
1597  * `g_strreverse ("abcdef")` will result in "fedcba".
1598  *
1599  * Note that g_strreverse() doesn't work on UTF-8 strings
1600  * containing multibyte characters. For that purpose, use
1601  * g_utf8_strreverse().
1602  *
1603  * Returns: the same pointer passed in as @string
1604  */
1605 gchar*
1606 g_strreverse (gchar *string)
1607 {
1608   g_return_val_if_fail (string != NULL, NULL);
1609
1610   if (*string)
1611     {
1612       gchar *h, *t;
1613
1614       h = string;
1615       t = string + strlen (string) - 1;
1616
1617       while (h < t)
1618         {
1619           gchar c;
1620
1621           c = *h;
1622           *h = *t;
1623           h++;
1624           *t = c;
1625           t--;
1626         }
1627     }
1628
1629   return string;
1630 }
1631
1632 /**
1633  * g_ascii_tolower:
1634  * @c: any character
1635  *
1636  * Convert a character to ASCII lower case.
1637  *
1638  * Unlike the standard C library tolower() function, this only
1639  * recognizes standard ASCII letters and ignores the locale, returning
1640  * all non-ASCII characters unchanged, even if they are lower case
1641  * letters in a particular character set. Also unlike the standard
1642  * library function, this takes and returns a char, not an int, so
1643  * don't call it on %EOF but no need to worry about casting to #guchar
1644  * before passing a possibly non-ASCII character in.
1645  *
1646  * Returns: the result of converting @c to lower case. If @c is
1647  *     not an ASCII upper case letter, @c is returned unchanged.
1648  */
1649 gchar
1650 g_ascii_tolower (gchar c)
1651 {
1652   return g_ascii_isupper (c) ? c - 'A' + 'a' : c;
1653 }
1654
1655 /**
1656  * g_ascii_toupper:
1657  * @c: any character
1658  *
1659  * Convert a character to ASCII upper case.
1660  *
1661  * Unlike the standard C library toupper() function, this only
1662  * recognizes standard ASCII letters and ignores the locale, returning
1663  * all non-ASCII characters unchanged, even if they are upper case
1664  * letters in a particular character set. Also unlike the standard
1665  * library function, this takes and returns a char, not an int, so
1666  * don't call it on %EOF but no need to worry about casting to #guchar
1667  * before passing a possibly non-ASCII character in.
1668  *
1669  * Returns: the result of converting @c to upper case. If @c is not
1670  *    an ASCII lower case letter, @c is returned unchanged.
1671  */
1672 gchar
1673 g_ascii_toupper (gchar c)
1674 {
1675   return g_ascii_islower (c) ? c - 'a' + 'A' : c;
1676 }
1677
1678 /**
1679  * g_ascii_digit_value:
1680  * @c: an ASCII character
1681  *
1682  * Determines the numeric value of a character as a decimal digit.
1683  * Differs from g_unichar_digit_value() because it takes a char, so
1684  * there's no worry about sign extension if characters are signed.
1685  *
1686  * Returns: If @c is a decimal digit (according to g_ascii_isdigit()),
1687  *    its numeric value. Otherwise, -1.
1688  */
1689 int
1690 g_ascii_digit_value (gchar c)
1691 {
1692   if (g_ascii_isdigit (c))
1693     return c - '0';
1694   return -1;
1695 }
1696
1697 /**
1698  * g_ascii_xdigit_value:
1699  * @c: an ASCII character.
1700  *
1701  * Determines the numeric value of a character as a hexidecimal
1702  * digit. Differs from g_unichar_xdigit_value() because it takes
1703  * a char, so there's no worry about sign extension if characters
1704  * are signed.
1705  *
1706  * Returns: If @c is a hex digit (according to g_ascii_isxdigit()),
1707  *     its numeric value. Otherwise, -1.
1708  */
1709 int
1710 g_ascii_xdigit_value (gchar c)
1711 {
1712   if (c >= 'A' && c <= 'F')
1713     return c - 'A' + 10;
1714   if (c >= 'a' && c <= 'f')
1715     return c - 'a' + 10;
1716   return g_ascii_digit_value (c);
1717 }
1718
1719 /**
1720  * g_ascii_strcasecmp:
1721  * @s1: string to compare with @s2
1722  * @s2: string to compare with @s1
1723  *
1724  * Compare two strings, ignoring the case of ASCII characters.
1725  *
1726  * Unlike the BSD strcasecmp() function, this only recognizes standard
1727  * ASCII letters and ignores the locale, treating all non-ASCII
1728  * bytes as if they are not letters.
1729  *
1730  * This function should be used only on strings that are known to be
1731  * in encodings where the bytes corresponding to ASCII letters always
1732  * represent themselves. This includes UTF-8 and the ISO-8859-*
1733  * charsets, but not for instance double-byte encodings like the
1734  * Windows Codepage 932, where the trailing bytes of double-byte
1735  * characters include all ASCII letters. If you compare two CP932
1736  * strings using this function, you will get false matches.
1737  *
1738  * Both @s1 and @s2 must be non-%NULL.
1739  *
1740  * Returns: 0 if the strings match, a negative value if @s1 < @s2,
1741  *     or a positive value if @s1 > @s2.
1742  */
1743 gint
1744 g_ascii_strcasecmp (const gchar *s1,
1745                     const gchar *s2)
1746 {
1747   gint c1, c2;
1748
1749   g_return_val_if_fail (s1 != NULL, 0);
1750   g_return_val_if_fail (s2 != NULL, 0);
1751
1752   while (*s1 && *s2)
1753     {
1754       c1 = (gint)(guchar) TOLOWER (*s1);
1755       c2 = (gint)(guchar) TOLOWER (*s2);
1756       if (c1 != c2)
1757         return (c1 - c2);
1758       s1++; s2++;
1759     }
1760
1761   return (((gint)(guchar) *s1) - ((gint)(guchar) *s2));
1762 }
1763
1764 /**
1765  * g_ascii_strncasecmp:
1766  * @s1: string to compare with @s2
1767  * @s2: string to compare with @s1
1768  * @n: number of characters to compare
1769  *
1770  * Compare @s1 and @s2, ignoring the case of ASCII characters and any
1771  * characters after the first @n in each string.
1772  *
1773  * Unlike the BSD strcasecmp() function, this only recognizes standard
1774  * ASCII letters and ignores the locale, treating all non-ASCII
1775  * characters as if they are not letters.
1776  *
1777  * The same warning as in g_ascii_strcasecmp() applies: Use this
1778  * function only on strings known to be in encodings where bytes
1779  * corresponding to ASCII letters always represent themselves.
1780  *
1781  * Returns: 0 if the strings match, a negative value if @s1 < @s2,
1782  *     or a positive value if @s1 > @s2.
1783  */
1784 gint
1785 g_ascii_strncasecmp (const gchar *s1,
1786                      const gchar *s2,
1787                      gsize        n)
1788 {
1789   gint c1, c2;
1790
1791   g_return_val_if_fail (s1 != NULL, 0);
1792   g_return_val_if_fail (s2 != NULL, 0);
1793
1794   while (n && *s1 && *s2)
1795     {
1796       n -= 1;
1797       c1 = (gint)(guchar) TOLOWER (*s1);
1798       c2 = (gint)(guchar) TOLOWER (*s2);
1799       if (c1 != c2)
1800         return (c1 - c2);
1801       s1++; s2++;
1802     }
1803
1804   if (n)
1805     return (((gint) (guchar) *s1) - ((gint) (guchar) *s2));
1806   else
1807     return 0;
1808 }
1809
1810 /**
1811  * g_strcasecmp:
1812  * @s1: a string
1813  * @s2: a string to compare with @s1
1814  *
1815  * A case-insensitive string comparison, corresponding to the standard
1816  * strcasecmp() function on platforms which support it.
1817  *
1818  * Returns: 0 if the strings match, a negative value if @s1 < @s2,
1819  *     or a positive value if @s1 > @s2.
1820  *
1821  * Deprecated:2.2: See g_strncasecmp() for a discussion of why this
1822  *     function is deprecated and how to replace it.
1823  */
1824 gint
1825 g_strcasecmp (const gchar *s1,
1826               const gchar *s2)
1827 {
1828 #ifdef HAVE_STRCASECMP
1829   g_return_val_if_fail (s1 != NULL, 0);
1830   g_return_val_if_fail (s2 != NULL, 0);
1831
1832   return strcasecmp (s1, s2);
1833 #else
1834   gint c1, c2;
1835
1836   g_return_val_if_fail (s1 != NULL, 0);
1837   g_return_val_if_fail (s2 != NULL, 0);
1838
1839   while (*s1 && *s2)
1840     {
1841       /* According to A. Cox, some platforms have islower's that
1842        * don't work right on non-uppercase
1843        */
1844       c1 = isupper ((guchar)*s1) ? tolower ((guchar)*s1) : *s1;
1845       c2 = isupper ((guchar)*s2) ? tolower ((guchar)*s2) : *s2;
1846       if (c1 != c2)
1847         return (c1 - c2);
1848       s1++; s2++;
1849     }
1850
1851   return (((gint)(guchar) *s1) - ((gint)(guchar) *s2));
1852 #endif
1853 }
1854
1855 /**
1856  * g_strncasecmp:
1857  * @s1: a string
1858  * @s2: a string to compare with @s1
1859  * @n: the maximum number of characters to compare
1860  *
1861  * A case-insensitive string comparison, corresponding to the standard
1862  * strncasecmp() function on platforms which support it. It is similar
1863  * to g_strcasecmp() except it only compares the first @n characters of
1864  * the strings.
1865  *
1866  * Returns: 0 if the strings match, a negative value if @s1 < @s2,
1867  *     or a positive value if @s1 > @s2.
1868  *
1869  * Deprecated:2.2: The problem with g_strncasecmp() is that it does
1870  *     the comparison by calling toupper()/tolower(). These functions
1871  *     are locale-specific and operate on single bytes. However, it is
1872  *     impossible to handle things correctly from an internationalization
1873  *     standpoint by operating on bytes, since characters may be multibyte.
1874  *     Thus g_strncasecmp() is broken if your string is guaranteed to be
1875  *     ASCII, since it is locale-sensitive, and it's broken if your string
1876  *     is localized, since it doesn't work on many encodings at all,
1877  *     including UTF-8, EUC-JP, etc.
1878  *
1879  *     There are therefore two replacement techniques: g_ascii_strncasecmp(),
1880  *     which only works on ASCII and is not locale-sensitive, and
1881  *     g_utf8_casefold() followed by strcmp() on the resulting strings,
1882  *     which is good for case-insensitive sorting of UTF-8.
1883  */
1884 gint
1885 g_strncasecmp (const gchar *s1,
1886                const gchar *s2,
1887                guint n)
1888 {
1889 #ifdef HAVE_STRNCASECMP
1890   return strncasecmp (s1, s2, n);
1891 #else
1892   gint c1, c2;
1893
1894   g_return_val_if_fail (s1 != NULL, 0);
1895   g_return_val_if_fail (s2 != NULL, 0);
1896
1897   while (n && *s1 && *s2)
1898     {
1899       n -= 1;
1900       /* According to A. Cox, some platforms have islower's that
1901        * don't work right on non-uppercase
1902        */
1903       c1 = isupper ((guchar)*s1) ? tolower ((guchar)*s1) : *s1;
1904       c2 = isupper ((guchar)*s2) ? tolower ((guchar)*s2) : *s2;
1905       if (c1 != c2)
1906         return (c1 - c2);
1907       s1++; s2++;
1908     }
1909
1910   if (n)
1911     return (((gint) (guchar) *s1) - ((gint) (guchar) *s2));
1912   else
1913     return 0;
1914 #endif
1915 }
1916
1917 /**
1918  * g_strdelimit:
1919  * @string: the string to convert
1920  * @delimiters: (allow-none): a string containing the current delimiters,
1921  *     or %NULL to use the standard delimiters defined in #G_STR_DELIMITERS
1922  * @new_delimiter: the new delimiter character
1923  *
1924  * Converts any delimiter characters in @string to @new_delimiter.
1925  * Any characters in @string which are found in @delimiters are
1926  * changed to the @new_delimiter character. Modifies @string in place,
1927  * and returns @string itself, not a copy. The return value is to
1928  * allow nesting such as
1929  * |[<!-- language="C" -->
1930  *   g_ascii_strup (g_strdelimit (str, "abc", '?'))
1931  * ]|
1932  *
1933  * Returns: @string
1934  */
1935 gchar *
1936 g_strdelimit (gchar       *string,
1937               const gchar *delimiters,
1938               gchar        new_delim)
1939 {
1940   gchar *c;
1941
1942   g_return_val_if_fail (string != NULL, NULL);
1943
1944   if (!delimiters)
1945     delimiters = G_STR_DELIMITERS;
1946
1947   for (c = string; *c; c++)
1948     {
1949       if (strchr (delimiters, *c))
1950         *c = new_delim;
1951     }
1952
1953   return string;
1954 }
1955
1956 /**
1957  * g_strcanon:
1958  * @string: a nul-terminated array of bytes
1959  * @valid_chars: bytes permitted in @string
1960  * @substitutor: replacement character for disallowed bytes
1961  *
1962  * For each character in @string, if the character is not in @valid_chars,
1963  * replaces the character with @substitutor. Modifies @string in place,
1964  * and return @string itself, not a copy. The return value is to allow
1965  * nesting such as
1966  * |[<!-- language="C" -->
1967  *   g_ascii_strup (g_strcanon (str, "abc", '?'))
1968  * ]|
1969  *
1970  * Returns: @string
1971  */
1972 gchar *
1973 g_strcanon (gchar       *string,
1974             const gchar *valid_chars,
1975             gchar        substitutor)
1976 {
1977   gchar *c;
1978
1979   g_return_val_if_fail (string != NULL, NULL);
1980   g_return_val_if_fail (valid_chars != NULL, NULL);
1981
1982   for (c = string; *c; c++)
1983     {
1984       if (!strchr (valid_chars, *c))
1985         *c = substitutor;
1986     }
1987
1988   return string;
1989 }
1990
1991 /**
1992  * g_strcompress:
1993  * @source: a string to compress
1994  *
1995  * Replaces all escaped characters with their one byte equivalent.
1996  *
1997  * This function does the reverse conversion of g_strescape().
1998  *
1999  * Returns: a newly-allocated copy of @source with all escaped
2000  *     character compressed
2001  */
2002 gchar *
2003 g_strcompress (const gchar *source)
2004 {
2005   const gchar *p = source, *octal;
2006   gchar *dest;
2007   gchar *q;
2008
2009   g_return_val_if_fail (source != NULL, NULL);
2010
2011   dest = g_malloc (strlen (source) + 1);
2012   q = dest;
2013
2014   while (*p)
2015     {
2016       if (*p == '\\')
2017         {
2018           p++;
2019           switch (*p)
2020             {
2021             case '\0':
2022               g_warning ("g_strcompress: trailing \\");
2023               goto out;
2024             case '0':  case '1':  case '2':  case '3':  case '4':
2025             case '5':  case '6':  case '7':
2026               *q = 0;
2027               octal = p;
2028               while ((p < octal + 3) && (*p >= '0') && (*p <= '7'))
2029                 {
2030                   *q = (*q * 8) + (*p - '0');
2031                   p++;
2032                 }
2033               q++;
2034               p--;
2035               break;
2036             case 'b':
2037               *q++ = '\b';
2038               break;
2039             case 'f':
2040               *q++ = '\f';
2041               break;
2042             case 'n':
2043               *q++ = '\n';
2044               break;
2045             case 'r':
2046               *q++ = '\r';
2047               break;
2048             case 't':
2049               *q++ = '\t';
2050               break;
2051             case 'v':
2052               *q++ = '\v';
2053               break;
2054             default:            /* Also handles \" and \\ */
2055               *q++ = *p;
2056               break;
2057             }
2058         }
2059       else
2060         *q++ = *p;
2061       p++;
2062     }
2063 out:
2064   *q = 0;
2065
2066   return dest;
2067 }
2068
2069 /**
2070  * g_strescape:
2071  * @source: a string to escape
2072  * @exceptions: a string of characters not to escape in @source
2073  *
2074  * Escapes the special characters '\b', '\f', '\n', '\r', '\t', '\v', '\'
2075  * and '&quot;' in the string @source by inserting a '\' before
2076  * them. Additionally all characters in the range 0x01-0x1F (everything
2077  * below SPACE) and in the range 0x7F-0xFF (all non-ASCII chars) are
2078  * replaced with a '\' followed by their octal representation.
2079  * Characters supplied in @exceptions are not escaped.
2080  *
2081  * g_strcompress() does the reverse conversion.
2082  *
2083  * Returns: a newly-allocated copy of @source with certain
2084  *     characters escaped. See above.
2085  */
2086 gchar *
2087 g_strescape (const gchar *source,
2088              const gchar *exceptions)
2089 {
2090   const guchar *p;
2091   gchar *dest;
2092   gchar *q;
2093   guchar excmap[256];
2094
2095   g_return_val_if_fail (source != NULL, NULL);
2096
2097   p = (guchar *) source;
2098   /* Each source byte needs maximally four destination chars (\777) */
2099   q = dest = g_malloc (strlen (source) * 4 + 1);
2100
2101   memset (excmap, 0, 256);
2102   if (exceptions)
2103     {
2104       guchar *e = (guchar *) exceptions;
2105
2106       while (*e)
2107         {
2108           excmap[*e] = 1;
2109           e++;
2110         }
2111     }
2112
2113   while (*p)
2114     {
2115       if (excmap[*p])
2116         *q++ = *p;
2117       else
2118         {
2119           switch (*p)
2120             {
2121             case '\b':
2122               *q++ = '\\';
2123               *q++ = 'b';
2124               break;
2125             case '\f':
2126               *q++ = '\\';
2127               *q++ = 'f';
2128               break;
2129             case '\n':
2130               *q++ = '\\';
2131               *q++ = 'n';
2132               break;
2133             case '\r':
2134               *q++ = '\\';
2135               *q++ = 'r';
2136               break;
2137             case '\t':
2138               *q++ = '\\';
2139               *q++ = 't';
2140               break;
2141             case '\v':
2142               *q++ = '\\';
2143               *q++ = 'v';
2144               break;
2145             case '\\':
2146               *q++ = '\\';
2147               *q++ = '\\';
2148               break;
2149             case '"':
2150               *q++ = '\\';
2151               *q++ = '"';
2152               break;
2153             default:
2154               if ((*p < ' ') || (*p >= 0177))
2155                 {
2156                   *q++ = '\\';
2157                   *q++ = '0' + (((*p) >> 6) & 07);
2158                   *q++ = '0' + (((*p) >> 3) & 07);
2159                   *q++ = '0' + ((*p) & 07);
2160                 }
2161               else
2162                 *q++ = *p;
2163               break;
2164             }
2165         }
2166       p++;
2167     }
2168   *q = 0;
2169   return dest;
2170 }
2171
2172 /**
2173  * g_strchug:
2174  * @string: a string to remove the leading whitespace from
2175  *
2176  * Removes leading whitespace from a string, by moving the rest
2177  * of the characters forward.
2178  *
2179  * This function doesn't allocate or reallocate any memory;
2180  * it modifies @string in place. Therefore, it cannot be used on
2181  * statically allocated strings.
2182  *
2183  * The pointer to @string is returned to allow the nesting of functions.
2184  *
2185  * Also see g_strchomp() and g_strstrip().
2186  *
2187  * Returns: @string
2188  */
2189 gchar *
2190 g_strchug (gchar *string)
2191 {
2192   guchar *start;
2193
2194   g_return_val_if_fail (string != NULL, NULL);
2195
2196   for (start = (guchar*) string; *start && g_ascii_isspace (*start); start++)
2197     ;
2198
2199   memmove (string, start, strlen ((gchar *) start) + 1);
2200
2201   return string;
2202 }
2203
2204 /**
2205  * g_strchomp:
2206  * @string: a string to remove the trailing whitespace from
2207  *
2208  * Removes trailing whitespace from a string.
2209  *
2210  * This function doesn't allocate or reallocate any memory;
2211  * it modifies @string in place. Therefore, it cannot be used
2212  * on statically allocated strings.
2213  *
2214  * The pointer to @string is returned to allow the nesting of functions.
2215  *
2216  * Also see g_strchug() and g_strstrip().
2217  *
2218  * Returns: @string
2219  */
2220 gchar *
2221 g_strchomp (gchar *string)
2222 {
2223   gsize len;
2224
2225   g_return_val_if_fail (string != NULL, NULL);
2226
2227   len = strlen (string);
2228   while (len--)
2229     {
2230       if (g_ascii_isspace ((guchar) string[len]))
2231         string[len] = '\0';
2232       else
2233         break;
2234     }
2235
2236   return string;
2237 }
2238
2239 /**
2240  * g_strsplit:
2241  * @string: a string to split
2242  * @delimiter: a string which specifies the places at which to split
2243  *     the string. The delimiter is not included in any of the resulting
2244  *     strings, unless @max_tokens is reached.
2245  * @max_tokens: the maximum number of pieces to split @string into.
2246  *     If this is less than 1, the string is split completely.
2247  *
2248  * Splits a string into a maximum of @max_tokens pieces, using the given
2249  * @delimiter. If @max_tokens is reached, the remainder of @string is
2250  * appended to the last token.
2251  *
2252  * As an example, the result of g_strsplit (":a:bc::d:", ":", -1) is a
2253  * %NULL-terminated vector containing the six strings "", "a", "bc", "", "d"
2254  * and "".
2255  *
2256  * As a special case, the result of splitting the empty string "" is an empty
2257  * vector, not a vector containing a single string. The reason for this
2258  * special case is that being able to represent a empty vector is typically
2259  * more useful than consistent handling of empty elements. If you do need
2260  * to represent empty elements, you'll need to check for the empty string
2261  * before calling g_strsplit().
2262  *
2263  * Returns: a newly-allocated %NULL-terminated array of strings. Use
2264  *    g_strfreev() to free it.
2265  */
2266 gchar**
2267 g_strsplit (const gchar *string,
2268             const gchar *delimiter,
2269             gint         max_tokens)
2270 {
2271   GSList *string_list = NULL, *slist;
2272   gchar **str_array, *s;
2273   guint n = 0;
2274   const gchar *remainder;
2275
2276   g_return_val_if_fail (string != NULL, NULL);
2277   g_return_val_if_fail (delimiter != NULL, NULL);
2278   g_return_val_if_fail (delimiter[0] != '\0', NULL);
2279
2280   if (max_tokens < 1)
2281     max_tokens = G_MAXINT;
2282
2283   remainder = string;
2284   s = strstr (remainder, delimiter);
2285   if (s)
2286     {
2287       gsize delimiter_len = strlen (delimiter);
2288
2289       while (--max_tokens && s)
2290         {
2291           gsize len;
2292
2293           len = s - remainder;
2294           string_list = g_slist_prepend (string_list,
2295                                          g_strndup (remainder, len));
2296           n++;
2297           remainder = s + delimiter_len;
2298           s = strstr (remainder, delimiter);
2299         }
2300     }
2301   if (*string)
2302     {
2303       n++;
2304       string_list = g_slist_prepend (string_list, g_strdup (remainder));
2305     }
2306
2307   str_array = g_new (gchar*, n + 1);
2308
2309   str_array[n--] = NULL;
2310   for (slist = string_list; slist; slist = slist->next)
2311     str_array[n--] = slist->data;
2312
2313   g_slist_free (string_list);
2314
2315   return str_array;
2316 }
2317
2318 /**
2319  * g_strsplit_set:
2320  * @string: The string to be tokenized
2321  * @delimiters: A nul-terminated string containing bytes that are used
2322  *     to split the string.
2323  * @max_tokens: The maximum number of tokens to split @string into.
2324  *     If this is less than 1, the string is split completely
2325  *
2326  * Splits @string into a number of tokens not containing any of the characters
2327  * in @delimiter. A token is the (possibly empty) longest string that does not
2328  * contain any of the characters in @delimiters. If @max_tokens is reached, the
2329  * remainder is appended to the last token.
2330  *
2331  * For example the result of g_strsplit_set ("abc:def/ghi", ":/", -1) is a
2332  * %NULL-terminated vector containing the three strings "abc", "def",
2333  * and "ghi".
2334  *
2335  * The result of g_strsplit_set (":def/ghi:", ":/", -1) is a %NULL-terminated
2336  * vector containing the four strings "", "def", "ghi", and "".
2337  *
2338  * As a special case, the result of splitting the empty string "" is an empty
2339  * vector, not a vector containing a single string. The reason for this
2340  * special case is that being able to represent a empty vector is typically
2341  * more useful than consistent handling of empty elements. If you do need
2342  * to represent empty elements, you'll need to check for the empty string
2343  * before calling g_strsplit_set().
2344  *
2345  * Note that this function works on bytes not characters, so it can't be used
2346  * to delimit UTF-8 strings for anything but ASCII characters.
2347  *
2348  * Returns: a newly-allocated %NULL-terminated array of strings. Use
2349  *    g_strfreev() to free it.
2350  *
2351  * Since: 2.4
2352  **/
2353 gchar **
2354 g_strsplit_set (const gchar *string,
2355                 const gchar *delimiters,
2356                 gint         max_tokens)
2357 {
2358   gboolean delim_table[256];
2359   GSList *tokens, *list;
2360   gint n_tokens;
2361   const gchar *s;
2362   const gchar *current;
2363   gchar *token;
2364   gchar **result;
2365
2366   g_return_val_if_fail (string != NULL, NULL);
2367   g_return_val_if_fail (delimiters != NULL, NULL);
2368
2369   if (max_tokens < 1)
2370     max_tokens = G_MAXINT;
2371
2372   if (*string == '\0')
2373     {
2374       result = g_new (char *, 1);
2375       result[0] = NULL;
2376       return result;
2377     }
2378
2379   memset (delim_table, FALSE, sizeof (delim_table));
2380   for (s = delimiters; *s != '\0'; ++s)
2381     delim_table[*(guchar *)s] = TRUE;
2382
2383   tokens = NULL;
2384   n_tokens = 0;
2385
2386   s = current = string;
2387   while (*s != '\0')
2388     {
2389       if (delim_table[*(guchar *)s] && n_tokens + 1 < max_tokens)
2390         {
2391           token = g_strndup (current, s - current);
2392           tokens = g_slist_prepend (tokens, token);
2393           ++n_tokens;
2394
2395           current = s + 1;
2396         }
2397
2398       ++s;
2399     }
2400
2401   token = g_strndup (current, s - current);
2402   tokens = g_slist_prepend (tokens, token);
2403   ++n_tokens;
2404
2405   result = g_new (gchar *, n_tokens + 1);
2406
2407   result[n_tokens] = NULL;
2408   for (list = tokens; list != NULL; list = list->next)
2409     result[--n_tokens] = list->data;
2410
2411   g_slist_free (tokens);
2412
2413   return result;
2414 }
2415
2416 /**
2417  * g_strfreev:
2418  * @str_array: a %NULL-terminated array of strings to free
2419  *
2420  * Frees a %NULL-terminated array of strings, as well as each
2421  * string it contains.
2422  *
2423  * If @str_array is %NULL, this function simply returns.
2424  */
2425 void
2426 g_strfreev (gchar **str_array)
2427 {
2428   if (str_array)
2429     {
2430       int i;
2431
2432       for (i = 0; str_array[i] != NULL; i++)
2433         g_free (str_array[i]);
2434
2435       g_free (str_array);
2436     }
2437 }
2438
2439 /**
2440  * g_strdupv:
2441  * @str_array: a %NULL-terminated array of strings
2442  *
2443  * Copies %NULL-terminated array of strings. The copy is a deep copy;
2444  * the new array should be freed by first freeing each string, then
2445  * the array itself. g_strfreev() does this for you. If called
2446  * on a %NULL value, g_strdupv() simply returns %NULL.
2447  *
2448  * Returns: a new %NULL-terminated array of strings.
2449  */
2450 gchar**
2451 g_strdupv (gchar **str_array)
2452 {
2453   if (str_array)
2454     {
2455       gint i;
2456       gchar **retval;
2457
2458       i = 0;
2459       while (str_array[i])
2460         ++i;
2461
2462       retval = g_new (gchar*, i + 1);
2463
2464       i = 0;
2465       while (str_array[i])
2466         {
2467           retval[i] = g_strdup (str_array[i]);
2468           ++i;
2469         }
2470       retval[i] = NULL;
2471
2472       return retval;
2473     }
2474   else
2475     return NULL;
2476 }
2477
2478 /**
2479  * g_strjoinv:
2480  * @separator: (allow-none): a string to insert between each of the
2481  *     strings, or %NULL
2482  * @str_array: a %NULL-terminated array of strings to join
2483  *
2484  * Joins a number of strings together to form one long string, with the
2485  * optional @separator inserted between each of them. The returned string
2486  * should be freed with g_free().
2487  *
2488  * Returns: a newly-allocated string containing all of the strings joined
2489  *     together, with @separator between them
2490  */
2491 gchar*
2492 g_strjoinv (const gchar  *separator,
2493             gchar       **str_array)
2494 {
2495   gchar *string;
2496   gchar *ptr;
2497
2498   g_return_val_if_fail (str_array != NULL, NULL);
2499
2500   if (separator == NULL)
2501     separator = "";
2502
2503   if (*str_array)
2504     {
2505       gint i;
2506       gsize len;
2507       gsize separator_len;
2508
2509       separator_len = strlen (separator);
2510       /* First part, getting length */
2511       len = 1 + strlen (str_array[0]);
2512       for (i = 1; str_array[i] != NULL; i++)
2513         len += strlen (str_array[i]);
2514       len += separator_len * (i - 1);
2515
2516       /* Second part, building string */
2517       string = g_new (gchar, len);
2518       ptr = g_stpcpy (string, *str_array);
2519       for (i = 1; str_array[i] != NULL; i++)
2520         {
2521           ptr = g_stpcpy (ptr, separator);
2522           ptr = g_stpcpy (ptr, str_array[i]);
2523         }
2524       }
2525   else
2526     string = g_strdup ("");
2527
2528   return string;
2529 }
2530
2531 /**
2532  * g_strjoin:
2533  * @separator: (allow-none): a string to insert between each of the
2534  *     strings, or %NULL
2535  * @...: a %NULL-terminated list of strings to join
2536  *
2537  * Joins a number of strings together to form one long string, with the
2538  * optional @separator inserted between each of them. The returned string
2539  * should be freed with g_free().
2540  *
2541  * Returns: a newly-allocated string containing all of the strings joined
2542  *     together, with @separator between them
2543  */
2544 gchar*
2545 g_strjoin (const gchar *separator,
2546            ...)
2547 {
2548   gchar *string, *s;
2549   va_list args;
2550   gsize len;
2551   gsize separator_len;
2552   gchar *ptr;
2553
2554   if (separator == NULL)
2555     separator = "";
2556
2557   separator_len = strlen (separator);
2558
2559   va_start (args, separator);
2560
2561   s = va_arg (args, gchar*);
2562
2563   if (s)
2564     {
2565       /* First part, getting length */
2566       len = 1 + strlen (s);
2567
2568       s = va_arg (args, gchar*);
2569       while (s)
2570         {
2571           len += separator_len + strlen (s);
2572           s = va_arg (args, gchar*);
2573         }
2574       va_end (args);
2575
2576       /* Second part, building string */
2577       string = g_new (gchar, len);
2578
2579       va_start (args, separator);
2580
2581       s = va_arg (args, gchar*);
2582       ptr = g_stpcpy (string, s);
2583
2584       s = va_arg (args, gchar*);
2585       while (s)
2586         {
2587           ptr = g_stpcpy (ptr, separator);
2588           ptr = g_stpcpy (ptr, s);
2589           s = va_arg (args, gchar*);
2590         }
2591     }
2592   else
2593     string = g_strdup ("");
2594
2595   va_end (args);
2596
2597   return string;
2598 }
2599
2600
2601 /**
2602  * g_strstr_len:
2603  * @haystack: a string
2604  * @haystack_len: the maximum length of @haystack. Note that -1 is
2605  *     a valid length, if @haystack is nul-terminated, meaning it will
2606  *     search through the whole string.
2607  * @needle: the string to search for
2608  *
2609  * Searches the string @haystack for the first occurrence
2610  * of the string @needle, limiting the length of the search
2611  * to @haystack_len.
2612  *
2613  * Returns: a pointer to the found occurrence, or
2614  *    %NULL if not found.
2615  */
2616 gchar *
2617 g_strstr_len (const gchar *haystack,
2618               gssize       haystack_len,
2619               const gchar *needle)
2620 {
2621   g_return_val_if_fail (haystack != NULL, NULL);
2622   g_return_val_if_fail (needle != NULL, NULL);
2623
2624   if (haystack_len < 0)
2625     return strstr (haystack, needle);
2626   else
2627     {
2628       const gchar *p = haystack;
2629       gsize needle_len = strlen (needle);
2630       const gchar *end;
2631       gsize i;
2632
2633       if (needle_len == 0)
2634         return (gchar *)haystack;
2635
2636       if (haystack_len < needle_len)
2637         return NULL;
2638
2639       end = haystack + haystack_len - needle_len;
2640
2641       while (p <= end && *p)
2642         {
2643           for (i = 0; i < needle_len; i++)
2644             if (p[i] != needle[i])
2645               goto next;
2646
2647           return (gchar *)p;
2648
2649         next:
2650           p++;
2651         }
2652
2653       return NULL;
2654     }
2655 }
2656
2657 /**
2658  * g_strrstr:
2659  * @haystack: a nul-terminated string
2660  * @needle: the nul-terminated string to search for
2661  *
2662  * Searches the string @haystack for the last occurrence
2663  * of the string @needle.
2664  *
2665  * Returns: a pointer to the found occurrence, or
2666  *    %NULL if not found.
2667  */
2668 gchar *
2669 g_strrstr (const gchar *haystack,
2670            const gchar *needle)
2671 {
2672   gsize i;
2673   gsize needle_len;
2674   gsize haystack_len;
2675   const gchar *p;
2676
2677   g_return_val_if_fail (haystack != NULL, NULL);
2678   g_return_val_if_fail (needle != NULL, NULL);
2679
2680   needle_len = strlen (needle);
2681   haystack_len = strlen (haystack);
2682
2683   if (needle_len == 0)
2684     return (gchar *)haystack;
2685
2686   if (haystack_len < needle_len)
2687     return NULL;
2688
2689   p = haystack + haystack_len - needle_len;
2690
2691   while (p >= haystack)
2692     {
2693       for (i = 0; i < needle_len; i++)
2694         if (p[i] != needle[i])
2695           goto next;
2696
2697       return (gchar *)p;
2698
2699     next:
2700       p--;
2701     }
2702
2703   return NULL;
2704 }
2705
2706 /**
2707  * g_strrstr_len:
2708  * @haystack: a nul-terminated string
2709  * @haystack_len: the maximum length of @haystack
2710  * @needle: the nul-terminated string to search for
2711  *
2712  * Searches the string @haystack for the last occurrence
2713  * of the string @needle, limiting the length of the search
2714  * to @haystack_len.
2715  *
2716  * Returns: a pointer to the found occurrence, or
2717  *    %NULL if not found.
2718  */
2719 gchar *
2720 g_strrstr_len (const gchar *haystack,
2721                gssize        haystack_len,
2722                const gchar *needle)
2723 {
2724   g_return_val_if_fail (haystack != NULL, NULL);
2725   g_return_val_if_fail (needle != NULL, NULL);
2726
2727   if (haystack_len < 0)
2728     return g_strrstr (haystack, needle);
2729   else
2730     {
2731       gsize needle_len = strlen (needle);
2732       const gchar *haystack_max = haystack + haystack_len;
2733       const gchar *p = haystack;
2734       gsize i;
2735
2736       while (p < haystack_max && *p)
2737         p++;
2738
2739       if (p < haystack + needle_len)
2740         return NULL;
2741
2742       p -= needle_len;
2743
2744       while (p >= haystack)
2745         {
2746           for (i = 0; i < needle_len; i++)
2747             if (p[i] != needle[i])
2748               goto next;
2749
2750           return (gchar *)p;
2751
2752         next:
2753           p--;
2754         }
2755
2756       return NULL;
2757     }
2758 }
2759
2760
2761 /**
2762  * g_str_has_suffix:
2763  * @str: a nul-terminated string
2764  * @suffix: the nul-terminated suffix to look for
2765  *
2766  * Looks whether the string @str ends with @suffix.
2767  *
2768  * Returns: %TRUE if @str end with @suffix, %FALSE otherwise.
2769  *
2770  * Since: 2.2
2771  */
2772 gboolean
2773 g_str_has_suffix (const gchar *str,
2774                   const gchar *suffix)
2775 {
2776   int str_len;
2777   int suffix_len;
2778
2779   g_return_val_if_fail (str != NULL, FALSE);
2780   g_return_val_if_fail (suffix != NULL, FALSE);
2781
2782   str_len = strlen (str);
2783   suffix_len = strlen (suffix);
2784
2785   if (str_len < suffix_len)
2786     return FALSE;
2787
2788   return strcmp (str + str_len - suffix_len, suffix) == 0;
2789 }
2790
2791 /**
2792  * g_str_has_prefix:
2793  * @str: a nul-terminated string
2794  * @prefix: the nul-terminated prefix to look for
2795  *
2796  * Looks whether the string @str begins with @prefix.
2797  *
2798  * Returns: %TRUE if @str begins with @prefix, %FALSE otherwise.
2799  *
2800  * Since: 2.2
2801  */
2802 gboolean
2803 g_str_has_prefix (const gchar *str,
2804                   const gchar *prefix)
2805 {
2806   g_return_val_if_fail (str != NULL, FALSE);
2807   g_return_val_if_fail (prefix != NULL, FALSE);
2808
2809   return strncmp (str, prefix, strlen (prefix)) == 0;
2810 }
2811
2812 /**
2813  * g_strv_length:
2814  * @str_array: a %NULL-terminated array of strings
2815  *
2816  * Returns the length of the given %NULL-terminated
2817  * string array @str_array.
2818  *
2819  * Returns: length of @str_array.
2820  *
2821  * Since: 2.6
2822  */
2823 guint
2824 g_strv_length (gchar **str_array)
2825 {
2826   guint i = 0;
2827
2828   g_return_val_if_fail (str_array != NULL, 0);
2829
2830   while (str_array[i])
2831     ++i;
2832
2833   return i;
2834 }
2835
2836 static void
2837 index_add_folded (GPtrArray   *array,
2838                   const gchar *start,
2839                   const gchar *end)
2840 {
2841   gchar *normal;
2842
2843   normal = g_utf8_normalize (start, end - start, G_NORMALIZE_ALL_COMPOSE);
2844
2845   /* TODO: Invent time machine.  Converse with Mustafa Ataturk... */
2846   if (strstr (normal, "ı") || strstr (normal, "İ"))
2847     {
2848       gchar *s = normal;
2849       GString *tmp;
2850
2851       tmp = g_string_new (NULL);
2852
2853       while (*s)
2854         {
2855           gchar *i, *I, *e;
2856
2857           i = strstr (s, "ı");
2858           I = strstr (s, "İ");
2859
2860           if (!i && !I)
2861             break;
2862           else if (i && !I)
2863             e = i;
2864           else if (I && !i)
2865             e = I;
2866           else if (i < I)
2867             e = i;
2868           else
2869             e = I;
2870
2871           g_string_append_len (tmp, s, e - s);
2872           g_string_append_c (tmp, 'i');
2873           s = g_utf8_next_char (e);
2874         }
2875
2876       g_string_append (tmp, s);
2877       g_free (normal);
2878       normal = g_string_free (tmp, FALSE);
2879     }
2880
2881   g_ptr_array_add (array, g_utf8_casefold (normal, -1));
2882   g_free (normal);
2883 }
2884
2885 static gchar **
2886 split_words (const gchar *value)
2887 {
2888   const gchar *start = NULL;
2889   GPtrArray *result;
2890   const gchar *s;
2891
2892   result = g_ptr_array_new ();
2893
2894   for (s = value; *s; s = g_utf8_next_char (s))
2895     {
2896       gunichar c = g_utf8_get_char (s);
2897
2898       if (start == NULL)
2899         {
2900           if (g_unichar_isalnum (c) || g_unichar_ismark (c))
2901             start = s;
2902         }
2903       else
2904         {
2905           if (!g_unichar_isalnum (c) && !g_unichar_ismark (c))
2906             {
2907               index_add_folded (result, start, s);
2908               start = NULL;
2909             }
2910         }
2911     }
2912
2913   if (start)
2914     index_add_folded (result, start, s);
2915
2916   g_ptr_array_add (result, NULL);
2917
2918   return (gchar **) g_ptr_array_free (result, FALSE);
2919 }
2920
2921 /**
2922  * g_str_tokenize_and_fold:
2923  * @string: a string
2924  * @translit_locale: (allow-none): the language code (like 'de' or
2925  *   'en_GB') from which @string originates
2926  * @ascii_alternates: (out) (transfer full) (array zero-terminated=1): a
2927  *   return location for ASCII alternates
2928  *
2929  * Tokenises @string and performs folding on each token.
2930  *
2931  * A token is a non-empty sequence of alphanumeric characters in the
2932  * source string, separated by non-alphanumeric characters.  An
2933  * "alphanumeric" character for this purpose is one that matches
2934  * g_unichar_isalnum() or g_unichar_ismark().
2935  *
2936  * Each token is then (Unicode) normalised and case-folded.  If
2937  * @ascii_alternates is non-%NULL and some of the returned tokens
2938  * contain non-ASCII characters, ASCII alternatives will be generated.
2939  *
2940  * The number of ASCII alternatives that are generated and the method
2941  * for doing so is unspecified, but @translit_locale (if specified) may
2942  * improve the transliteration if the language of the source string is
2943  * known.
2944  *
2945  * Returns: (transfer full) (array zero-terminated=1): the folded tokens
2946  *
2947  * Since: 2.40
2948  **/
2949 gchar **
2950 g_str_tokenize_and_fold (const gchar   *string,
2951                          const gchar   *translit_locale,
2952                          gchar       ***ascii_alternates)
2953 {
2954   gchar **result;
2955
2956   g_return_val_if_fail (string != NULL, NULL);
2957
2958   if (ascii_alternates && g_str_is_ascii (string))
2959     {
2960       *ascii_alternates = g_new0 (gchar *, 0 + 1);
2961       ascii_alternates = NULL;
2962     }
2963
2964   result = split_words (string);
2965
2966   if (ascii_alternates)
2967     {
2968       gint i, j, n;
2969
2970       n = g_strv_length (result);
2971       *ascii_alternates = g_new (gchar *, n + 1);
2972       j = 0;
2973
2974       for (i = 0; i < n; i++)
2975         {
2976           if (!g_str_is_ascii (result[i]))
2977             {
2978               gchar *composed;
2979               gchar *ascii;
2980               gint k;
2981
2982               composed = g_utf8_normalize (result[i], -1, G_NORMALIZE_ALL_COMPOSE);
2983
2984               ascii = g_str_to_ascii (composed, translit_locale);
2985
2986               /* Only accept strings that are now entirely alnums */
2987               for (k = 0; ascii[k]; k++)
2988                 if (!g_ascii_isalnum (ascii[k]))
2989                   break;
2990
2991               if (ascii[k] == '\0')
2992                 /* Made it to the end... */
2993                 (*ascii_alternates)[j++] = ascii;
2994               else
2995                 g_free (ascii);
2996
2997               g_free (composed);
2998             }
2999         }
3000
3001       (*ascii_alternates)[j] = NULL;
3002     }
3003
3004   return result;
3005 }
3006
3007 /**
3008  * g_str_match_string:
3009  * @search_term: the search term from the user
3010  * @potential_hit: the text that may be a hit
3011  * @accept_alternates: %TRUE to accept ASCII alternates
3012  *
3013  * Checks if a search conducted for @search_term should match
3014  * @potential_hit.
3015  *
3016  * This function calls g_str_tokenize_and_fold() on both
3017  * @search_term and @potential_hit.  ASCII alternates are never taken
3018  * for @search_term but will be taken for @potential_hit according to
3019  * the value of @accept_alternates.
3020  *
3021  * A hit occurs when each folded token in @search_term is a prefix of a
3022  * folded token from @potential_hit.
3023  *
3024  * Depending on how you're performing the search, it will typically be
3025  * faster to call g_str_tokenize_and_fold() on each string in
3026  * your corpus and build an index on the returned folded tokens, then
3027  * call g_str_tokenize_and_fold() on the search term and
3028  * perform lookups into that index.
3029  *
3030  * As some examples, searching for "fred" would match the potential hit
3031  * "Smith, Fred" and also "Frédéric".  Searching for "Fréd" would match
3032  * "Frédéric" but not "Frederic" (due to the one-directional nature of
3033  * accent matching).  Searching "fo" would match "Foo" and "Bar Foo
3034  * Baz", but not "SFO" (because no word as "fo" as a prefix).
3035  *
3036  * Returns: %TRUE if @potential_hit is a hit
3037  *
3038  * Since: 2.40
3039  **/
3040 gboolean
3041 g_str_match_string (const gchar *search_term,
3042                     const gchar *potential_hit,
3043                     gboolean     accept_alternates)
3044 {
3045   gchar **alternates = NULL;
3046   gchar **term_tokens;
3047   gchar **hit_tokens;
3048   gboolean matched;
3049   gint i, j;
3050
3051   g_return_val_if_fail (search_term != NULL, FALSE);
3052   g_return_val_if_fail (potential_hit != NULL, FALSE);
3053
3054   term_tokens = g_str_tokenize_and_fold (search_term, NULL, NULL);
3055   hit_tokens = g_str_tokenize_and_fold (potential_hit, NULL, accept_alternates ? &alternates : NULL);
3056
3057   matched = TRUE;
3058
3059   for (i = 0; term_tokens[i]; i++)
3060     {
3061       for (j = 0; hit_tokens[j]; j++)
3062         if (g_str_has_prefix (hit_tokens[j], term_tokens[i]))
3063           goto one_matched;
3064
3065       if (accept_alternates)
3066         for (j = 0; alternates[j]; j++)
3067           if (g_str_has_prefix (alternates[j], term_tokens[i]))
3068             goto one_matched;
3069
3070       matched = FALSE;
3071       break;
3072
3073 one_matched:
3074       continue;
3075     }
3076
3077   g_strfreev (term_tokens);
3078   g_strfreev (hit_tokens);
3079   g_strfreev (alternates);
3080
3081   return matched;
3082 }
3083
3084 /**
3085  * g_strv_contains:
3086  * @strv: a %NULL-terminated array of strings
3087  * @str: a string
3088  *
3089  * Checks if @strv contains @str. @strv must not be %NULL.
3090  *
3091  * Returns: %TRUE if @str is an element of @strv, according to g_str_equal().
3092  *
3093  * Since: 2.44
3094  */
3095 gboolean
3096 g_strv_contains (const gchar * const *strv,
3097                  const gchar         *str)
3098 {
3099   g_return_val_if_fail (strv != NULL, FALSE);
3100   g_return_val_if_fail (str != NULL, FALSE);
3101
3102   for (; *strv != NULL; strv++)
3103     {
3104       if (g_str_equal (str, *strv))
3105         return TRUE;
3106     }
3107
3108   return FALSE;
3109 }