Patch-ID: bash41-010
[bash.git] / locale.c
blob2f2e9fc45bd7f10c38733c9c2787fd82770625e3
1 /* locale.c - Miscellaneous internationalization functions. */
3 /* Copyright (C) 1996-2009 Free Software Foundation, Inc.
5 This file is part of GNU Bash, the Bourne Again SHell.
7 Bash is free software: you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation, either version 3 of the License, or
10 (at your option) any later version.
12 Bash is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with Bash. If not, see <http://www.gnu.org/licenses/>.
21 #include "config.h"
23 #include "bashtypes.h"
25 #if defined (HAVE_UNISTD_H)
26 # include <unistd.h>
27 #endif
29 #include "bashintl.h"
30 #include "bashansi.h"
31 #include <stdio.h>
32 #include "chartypes.h"
33 #include <errno.h>
35 #include "shell.h"
36 #include "input.h" /* For bash_input */
38 #ifndef errno
39 extern int errno;
40 #endif
/* Flags defined in another file.  localeexpand() consults them to decide
   whether to print translatable strings (optionally in `po' file format)
   instead of translating them. */
42 extern int dump_translatable_strings, dump_po_strings;
44 /* The current locale when the program begins.  Set by set_default_locale()
   from the value returned by setlocale (LC_ALL, ""). */
45 static char *default_locale;
47 /* The current domain for textdomain(3); tracks the value of TEXTDOMAIN. */
48 static char *default_domain;
/* The directory bound to default_domain with bindtextdomain(3); tracks the
   value of TEXTDOMAINDIR. */
49 static char *default_dir;
51 /* tracks the value of LC_ALL; used to override values for other locale
52 categories */
53 static char *lc_all;
55 /* tracks the value of LANG; used to provide defaults for locale
56 categories */
57 static char *lang;
59 /* Called to reset all of the locale variables to their appropriate values
60 if (and only if) LC_ALL has not been assigned a value. */
61 static int reset_locale_vars __P((void));
/* Recomputes the CSHBRK/CBLANK flags in sh_syntaxtab; called after the
   LC_CTYPE locale may have changed. */
63 static void locale_setblanks __P((void));
65 /* Set the value of default_locale and make the current locale the
66 system default locale. This should be called very early in main(). */
67 void
68 set_default_locale ()
70 #if defined (HAVE_SETLOCALE)
71 default_locale = setlocale (LC_ALL, "");
72 if (default_locale)
73 default_locale = savestring (default_locale);
74 #endif /* HAVE_SETLOCALE */
75 bindtextdomain (PACKAGE, LOCALEDIR);
76 textdomain (PACKAGE);
79 /* Set default values for LC_CTYPE, LC_COLLATE, LC_MESSAGES, LC_NUMERIC and
80 LC_TIME if they are not specified in the environment, but LC_ALL is. This
81 should be called from main() after parsing the environment. */
82 void
83 set_default_locale_vars ()
85 char *val;
87 #if defined (HAVE_SETLOCALE)
89 # if defined (LC_CTYPE)
90 val = get_string_value ("LC_CTYPE");
91 if (val == 0 && lc_all && *lc_all)
93 setlocale (LC_CTYPE, lc_all);
94 locale_setblanks ();
96 # endif
98 # if defined (LC_COLLATE)
99 val = get_string_value ("LC_COLLATE");
100 if (val == 0 && lc_all && *lc_all)
101 setlocale (LC_COLLATE, lc_all);
102 # endif /* LC_COLLATE */
104 # if defined (LC_MESSAGES)
105 val = get_string_value ("LC_MESSAGES");
106 if (val == 0 && lc_all && *lc_all)
107 setlocale (LC_MESSAGES, lc_all);
108 # endif /* LC_MESSAGES */
110 # if defined (LC_NUMERIC)
111 val = get_string_value ("LC_NUMERIC");
112 if (val == 0 && lc_all && *lc_all)
113 setlocale (LC_NUMERIC, lc_all);
114 # endif /* LC_NUMERIC */
116 # if defined (LC_TIME)
117 val = get_string_value ("LC_TIME");
118 if (val == 0 && lc_all && *lc_all)
119 setlocale (LC_TIME, lc_all);
120 # endif /* LC_TIME */
122 #endif /* HAVE_SETLOCALE */
124 val = get_string_value ("TEXTDOMAIN");
125 if (val && *val)
127 FREE (default_domain);
128 default_domain = savestring (val);
129 #if 0
130 /* Don't want to override the shell's textdomain as the default */
131 textdomain (default_domain);
132 #endif
135 val = get_string_value ("TEXTDOMAINDIR");
136 if (val && *val)
138 FREE (default_dir);
139 default_dir = savestring (val);
140 if (default_domain && *default_domain)
141 bindtextdomain (default_domain, default_dir);
145 /* Set one of the locale categories (specified by VAR) to VALUE. Returns 1
146 if successful, 0 otherwise. */
148 set_locale_var (var, value)
149 char *var, *value;
151 int r;
152 char *x;
154 x = "";
155 errno = 0;
156 if (var[0] == 'T' && var[10] == 0) /* TEXTDOMAIN */
158 FREE (default_domain);
159 default_domain = value ? savestring (value) : (char *)NULL;
160 #if 0
161 /* Don't want to override the shell's textdomain as the default */
162 textdomain (default_domain);
163 #endif
164 return (1);
166 else if (var[0] == 'T') /* TEXTDOMAINDIR */
168 FREE (default_dir);
169 default_dir = value ? savestring (value) : (char *)NULL;
170 if (default_domain && *default_domain)
171 bindtextdomain (default_domain, default_dir);
172 return (1);
175 /* var[0] == 'L' && var[1] == 'C' && var[2] == '_' */
177 else if (var[3] == 'A') /* LC_ALL */
179 FREE (lc_all);
180 if (value)
181 lc_all = savestring (value);
182 else
184 lc_all = (char *)xmalloc (1);
185 lc_all[0] = '\0';
187 #if defined (HAVE_SETLOCALE)
188 r = *lc_all ? ((x = setlocale (LC_ALL, lc_all)) != 0) : reset_locale_vars ();
189 if (x == 0)
191 if (errno == 0)
192 internal_warning(_("setlocale: LC_ALL: cannot change locale (%s)"), lc_all);
193 else
194 internal_warning(_("setlocale: LC_ALL: cannot change locale (%s): %s"), lc_all, strerror (errno));
196 locale_setblanks ();
197 return r;
198 #else
199 return (1);
200 #endif
203 #if defined (HAVE_SETLOCALE)
204 else if (var[3] == 'C' && var[4] == 'T') /* LC_CTYPE */
206 # if defined (LC_CTYPE)
207 if (lc_all == 0 || *lc_all == '\0')
209 x = setlocale (LC_CTYPE, get_locale_var ("LC_CTYPE"));
210 locale_setblanks ();
212 # endif
214 else if (var[3] == 'C' && var[4] == 'O') /* LC_COLLATE */
216 # if defined (LC_COLLATE)
217 if (lc_all == 0 || *lc_all == '\0')
218 x = setlocale (LC_COLLATE, get_locale_var ("LC_COLLATE"));
219 # endif /* LC_COLLATE */
221 else if (var[3] == 'M' && var[4] == 'E') /* LC_MESSAGES */
223 # if defined (LC_MESSAGES)
224 if (lc_all == 0 || *lc_all == '\0')
225 x = setlocale (LC_MESSAGES, get_locale_var ("LC_MESSAGES"));
226 # endif /* LC_MESSAGES */
228 else if (var[3] == 'N' && var[4] == 'U') /* LC_NUMERIC */
230 # if defined (LC_NUMERIC)
231 if (lc_all == 0 || *lc_all == '\0')
232 x = setlocale (LC_NUMERIC, get_locale_var ("LC_NUMERIC"));
233 # endif /* LC_NUMERIC */
235 else if (var[3] == 'T' && var[4] == 'I') /* LC_TIME */
237 # if defined (LC_TIME)
238 if (lc_all == 0 || *lc_all == '\0')
239 x = setlocale (LC_TIME, get_locale_var ("LC_TIME"));
240 # endif /* LC_TIME */
242 #endif /* HAVE_SETLOCALE */
244 if (x == 0)
246 if (errno == 0)
247 internal_warning(_("setlocale: %s: cannot change locale (%s)"), var, get_locale_var (var));
248 else
249 internal_warning(_("setlocale: %s: cannot change locale (%s): %s"), var, get_locale_var (var), strerror (errno));
252 return (x != 0);
255 /* Called when LANG is assigned a value. Tracks value in `lang'. Calls
256 reset_locale_vars() to reset any default values if LC_ALL is unset or
257 null. */
259 set_lang (var, value)
260 char *var, *value;
262 FREE (lang);
263 if (value)
264 lang = savestring (value);
265 else
267 lang = (char *)xmalloc (1);
268 lang[0] = '\0';
271 return ((lc_all == 0 || *lc_all == 0) ? reset_locale_vars () : 0);
/* Initialize the tracked values of LC_ALL and LANG, in that order, from the
   current shell variables.  Default values for all other locale-related
   variables depend on these two. */
void
set_default_lang ()
{
  set_locale_var ("LC_ALL", get_string_value ("LC_ALL"));
  set_lang ("LANG", get_string_value ("LANG"));
}
288 /* Get the value of one of the locale variables (LC_MESSAGES, LC_CTYPE).
289 The precedence is as POSIX.2 specifies: LC_ALL has precedence over
290 the specific locale variables, and LANG, if set, is used as the default. */
291 char *
292 get_locale_var (var)
293 char *var;
295 char *locale;
297 locale = lc_all;
299 if (locale == 0 || *locale == 0)
300 locale = get_string_value (var);
301 if (locale == 0 || *locale == 0)
302 locale = lang;
303 if (locale == 0 || *locale == 0)
304 #if 0
305 locale = default_locale; /* system-dependent; not really portable. should it be "C"? */
306 #else
307 locale = "";
308 #endif
309 return (locale);
/* Recompute every locale category from LANG and the individual LC_xxx
   variables.  DO NOT CALL THIS IF LC_ALL HAS BEEN ASSIGNED A VALUE.
   Returns 0 if setlocale (LC_ALL, ...) with the value of LANG fails and 1
   otherwise; the results of the per-category setlocale() calls are not
   checked.  Without HAVE_SETLOCALE this does nothing and returns 1. */
static int
reset_locale_vars ()
{
#if defined (HAVE_SETLOCALE)
  char *base;

  /* With no usable LANG, setlocale() is handed "" and consults the
     environment, so refresh the export environment first (trusting that
     this changes the environment setlocale() sees). */
  if (lang == 0 || *lang == '\0')
    maybe_make_export_env ();

  base = (lang != 0) ? lang : "";
  if (setlocale (LC_ALL, base) == 0)
    return 0;

  /* Layer the individual category settings on top of the base locale. */
#  if defined (LC_CTYPE)
  (void) setlocale (LC_CTYPE, get_locale_var ("LC_CTYPE"));
#  endif
#  if defined (LC_COLLATE)
  (void) setlocale (LC_COLLATE, get_locale_var ("LC_COLLATE"));
#  endif
#  if defined (LC_MESSAGES)
  (void) setlocale (LC_MESSAGES, get_locale_var ("LC_MESSAGES"));
#  endif
#  if defined (LC_NUMERIC)
  (void) setlocale (LC_NUMERIC, get_locale_var ("LC_NUMERIC"));
#  endif
#  if defined (LC_TIME)
  (void) setlocale (LC_TIME, get_locale_var ("LC_TIME"));
#  endif

  locale_setblanks ();

#endif /* HAVE_SETLOCALE */
  return 1;
}
347 /* Translate the contents of STRING, a $"..." quoted string, according
348 to the current locale. In the `C' or `POSIX' locale, or if gettext()
349 is not available, the passed string is returned unchanged. The
350 length of the translated string is returned in LENP, if non-null. */
351 char *
352 localetrans (string, len, lenp)
353 char *string;
354 int len, *lenp;
356 char *locale, *t;
357 char *translated;
358 int tlen;
360 /* Don't try to translate null strings. */
361 if (string == 0 || *string == 0)
363 if (lenp)
364 *lenp = 0;
365 return ((char *)NULL);
368 locale = get_locale_var ("LC_MESSAGES");
370 /* If we don't have setlocale() or the current locale is `C' or `POSIX',
371 just return the string. If we don't have gettext(), there's no use
372 doing anything else. */
373 if (locale == 0 || locale[0] == '\0' ||
374 (locale[0] == 'C' && locale[1] == '\0') || STREQ (locale, "POSIX"))
376 t = (char *)xmalloc (len + 1);
377 strcpy (t, string);
378 if (lenp)
379 *lenp = len;
380 return (t);
383 /* Now try to translate it. */
384 if (default_domain && *default_domain)
385 translated = dgettext (default_domain, string);
386 else
387 translated = string;
389 if (translated == string) /* gettext returns its argument if untranslatable */
391 t = (char *)xmalloc (len + 1);
392 strcpy (t, string);
393 if (lenp)
394 *lenp = len;
396 else
398 tlen = strlen (translated);
399 t = (char *)xmalloc (tlen + 1);
400 strcpy (t, translated);
401 if (lenp)
402 *lenp = tlen;
404 return (t);
/* Convert STRING into a double-quoted string suitable for a `po' file.
   `"' and `\' are preceded by a backslash, and each newline becomes the
   five characters  \n"<NL>"  (closing the current quoted line and opening
   a new one).  The result starts and ends with `"', is null-terminated and
   allocated with xmalloc().  A null STRING yields `""'.  If a newline is
   seen and FOUNDNLP is non-null, *FOUNDNLP is set to 1; it is never
   cleared here, so the caller must initialize it. */
char *
mk_msgstr (string, foundnlp)
     char *string;
     int *foundnlp;
{
  int size;
  char ch, *in, *out, *result;

  /* First pass: how much room do the escaped contents need?  A newline is
     counted as six characters although only five are written. */
  size = 0;
  if (string)
    for (in = string; *in; in++)
      switch (*in)
	{
	case '"':
	case '\\':
	  size += 2;
	  break;
	case '\n':
	  size += 6;
	  break;
	default:
	  size += 1;
	  break;
	}

  /* Two quotes plus the terminating null. */
  result = (char *)xmalloc (size + 3);
  out = result;
  *out++ = '"';

  /* Second pass: emit the escaped text. */
  if (string)
    for (in = string; (ch = *in) != '\0'; in++)
      switch (ch)
	{
	case '\n':		/* <NL> -> \n"<NL>" */
	  *out++ = '\\';
	  *out++ = 'n';
	  *out++ = '"';
	  *out++ = '\n';
	  *out++ = '"';
	  if (foundnlp)
	    *foundnlp = 1;
	  break;
	case '"':
	case '\\':
	  *out++ = '\\';
	  *out++ = ch;
	  break;
	default:
	  *out++ = ch;
	  break;
	}

  *out++ = '"';
  *out = '\0';

  return result;
}
453 /* $"..." -- Translate the portion of STRING between START and END
454 according to current locale using gettext (if available) and return
455 the result. The caller will take care of leaving the quotes intact.
456 The string will be left without the leading `$' by the caller.
457 If translation is performed, the translated string will be double-quoted
458 by the caller. The length of the translated string is returned in LENP,
459 if non-null. */
460 char *
461 localeexpand (string, start, end, lineno, lenp)
462 char *string;
463 int start, end, lineno, *lenp;
465 int len, tlen, foundnl;
466 char *temp, *t, *t2;
468 temp = (char *)xmalloc (end - start + 1);
469 for (tlen = 0, len = start; len < end; )
470 temp[tlen++] = string[len++];
471 temp[tlen] = '\0';
473 /* If we're just dumping translatable strings, don't do anything with the
474 string itself, but if we're dumping in `po' file format, convert it into
475 a form more palatable to gettext(3) and friends by quoting `"' and `\'
476 with backslashes and converting <NL> into `\n"<NL>"'. If we find a
477 newline in TEMP, we first output a `msgid ""' line and then the
478 translated string; otherwise we output the `msgid' and translated
479 string all on one line. */
480 if (dump_translatable_strings)
482 if (dump_po_strings)
484 foundnl = 0;
485 t = mk_msgstr (temp, &foundnl);
486 t2 = foundnl ? "\"\"\n" : "";
488 printf ("#: %s:%d\nmsgid %s%s\nmsgstr \"\"\n",
489 yy_input_name (), lineno, t2, t);
490 free (t);
492 else
493 printf ("\"%s\"\n", temp);
495 if (lenp)
496 *lenp = tlen;
497 return (temp);
499 else if (*temp)
501 t = localetrans (temp, tlen, &len);
502 free (temp);
503 if (lenp)
504 *lenp = len;
505 return (t);
507 else
509 if (lenp)
510 *lenp = 0;
511 return (temp);
515 /* Set every character in the <blank> character class to be a shell break
516 character for the lexical analyzer when the locale changes. */
517 static void
518 locale_setblanks ()
520 int x;
522 for (x = 0; x < sh_syntabsiz; x++)
524 if (isblank (x))
525 sh_syntaxtab[x] |= CSHBRK|CBLANK;
526 else if (member (x, shell_break_chars))
528 sh_syntaxtab[x] |= CSHBRK;
529 sh_syntaxtab[x] &= ~CBLANK;
531 else
532 sh_syntaxtab[x] &= ~(CSHBRK|CBLANK);