2 * Copyright © 2003, 2004 Christian Persch
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; either version 2, or (at your option)
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
23 #include "ephy-langs.h"
25 #include "ephy-debug.h"
27 #include <glib/gi18n.h>
31 #include <libxml/xmlreader.h>
33 /* If you add more language codes here, remember to also
34 * add them to data/generate-font-schemas.py .
36 static const EphyFontsLanguageInfo font_languages [] =
38 /* Translators: The text before the "|" is context to help you decide on
39 * the correct translation. You MUST OMIT it in the translated string. */
40 { N_("select fonts for|Arabic"), "ar" },
41 /* Translators: The text before the "|" is context to help you decide on
42 * the correct translation. You MUST OMIT it in the translated string. */
43 { N_("select fonts for|Baltic"), "x-baltic" },
44 /* Translators: The text before the "|" is context to help you decide on
45 * the correct translation. You MUST OMIT it in the translated string. */
46 { N_("select fonts for|Central European"), "x-central-euro" },
47 /* Translators: The text before the "|" is context to help you decide on
48 * the correct translation. You MUST OMIT it in the translated string. */
49 { N_("select fonts for|Cyrillic"), "x-cyrillic" },
50 /* Translators: The text before the "|" is context to help you decide on
51 * the correct translation. You MUST OMIT it in the translated string. */
52 { N_("select fonts for|Devanagari"), "x-devanagari" },
53 /* Translators: The text before the "|" is context to help you decide on
54 * the correct translation. You MUST OMIT it in the translated string. */
55 { N_("select fonts for|Greek"), "el" },
56 /* Translators: The text before the "|" is context to help you decide on
57 * the correct translation. You MUST OMIT it in the translated string. */
58 { N_("select fonts for|Hebrew"), "he" },
59 /* Translators: The text before the "|" is context to help you decide on
60 * the correct translation. You MUST OMIT it in the translated string. */
61 { N_("select fonts for|Japanese"), "ja" },
62 /* Translators: The text before the "|" is context to help you decide on
63 * the correct translation. You MUST OMIT it in the translated string. */
64 { N_("select fonts for|Korean"), "ko" },
65 /* Translators: The text before the "|" is context to help you decide on
66 * the correct translation. You MUST OMIT it in the translated string. */
67 { N_("select fonts for|Simplified Chinese"), "zh-CN" },
68 /* Translators: The text before the "|" is context to help you decide on
69 * the correct translation. You MUST OMIT it in the translated string. */
70 { N_("select fonts for|Tamil"), "x-tamil" },
71 /* Translators: The text before the "|" is context to help you decide on
72 * the correct translation. You MUST OMIT it in the translated string. */
73 { N_("select fonts for|Thai"), "th" },
74 /* Translators: The text before the "|" is context to help you decide on
75 * the correct translation. You MUST OMIT it in the translated string. */
76 { N_("select fonts for|Traditional Chinese"), "zh-TW" },
77 /* Translators: The text before the "|" is context to help you decide on
78 * the correct translation. You MUST OMIT it in the translated string. */
79 { N_("select fonts for|Traditional Chinese (Hong Kong)"), "zh-HK" },
80 /* Translators: The text before the "|" is context to help you decide on
81 * the correct translation. You MUST OMIT it in the translated string. */
82 { N_("select fonts for|Turkish"), "tr" },
83 /* Translators: The text before the "|" is context to help you decide on
84 * the correct translation. You MUST OMIT it in the translated string. */
85 { N_("select fonts for|Armenian"), "x-armn" },
86 /* Translators: The text before the "|" is context to help you decide on
87 * the correct translation. You MUST OMIT it in the translated string. */
88 { N_("select fonts for|Bengali"), "x-beng" },
89 /* Translators: The text before the "|" is context to help you decide on
90 * the correct translation. You MUST OMIT it in the translated string. */
91 { N_("select fonts for|Unified Canadian Syllabics"), "x-cans" },
92 /* Translators: The text before the "|" is context to help you decide on
93 * the correct translation. You MUST OMIT it in the translated string. */
94 { N_("select fonts for|Ethiopic"), "x-ethi" },
95 /* Translators: The text before the "|" is context to help you decide on
96 * the correct translation. You MUST OMIT it in the translated string. */
97 { N_("select fonts for|Georgian"), "x-geor" },
98 /* Translators: The text before the "|" is context to help you decide on
99 * the correct translation. You MUST OMIT it in the translated string. */
100 { N_("select fonts for|Gujarati"), "x-gujr" },
101 /* Translators: The text before the "|" is context to help you decide on
102 * the correct translation. You MUST OMIT it in the translated string. */
103 { N_("select fonts for|Gurmukhi"), "x-guru" },
104 /* Translators: The text before the "|" is context to help you decide on
105 * the correct translation. You MUST OMIT it in the translated string. */
106 { N_("select fonts for|Khmer"), "x-khmr" },
107 /* Translators: The text before the "|" is context to help you decide on
108 * the correct translation. You MUST OMIT it in the translated string. */
109 { N_("select fonts for|Malayalam"), "x-mlym" },
110 /* Translators: The text before the "|" is context to help you decide on
111 * the correct translation. You MUST OMIT it in the translated string. */
112 { N_("select fonts for|Western"), "x-western" },
113 /* Translators: The text before the "|" is context to help you decide on
114 * the correct translation. You MUST OMIT it in the translated string. */
115 { N_("select fonts for|Other Scripts"), "x-unicode" }
118 const EphyFontsLanguageInfo *
119 ephy_font_languages (void)
121 return font_languages;
125 ephy_font_n_languages (void)
127 return G_N_ELEMENTS (font_languages);
130 /* sanitise the languages list according to the rules for HTTP accept-language
131 * in RFC 2616, Sect. 14.4
134 ephy_langs_sanitise (GArray *array)
139 /* if we have 'xy-ab' in list but not 'xy', append 'xy' */
140 for (i = 0; i < array->len; i++)
142 gboolean found = FALSE;
145 lang1 = (char *) g_array_index (array,char *, i);
147 dash = strchr (lang1, '-');
148 if (dash == NULL) continue;
150 for (j = i + 1; j < array->len; j++)
152 lang2 = (char *) g_array_index (array, char *, j);
153 if (strchr (lang2, '-') == NULL &&
154 g_str_has_prefix (lang1, lang2))
162 prefix = g_strndup (lang1, dash - lang1);
163 g_array_append_val (array, prefix);
168 for (i = 0; i < (int) array->len - 1; i++)
170 for (j = (int) array->len - 1; j > i; j--)
172 lang1 = (char *) g_array_index (array,char *, i);
173 lang2 = (char *) g_array_index (array, char *, j);
175 if (strcmp (lang1, lang2) == 0)
177 g_array_remove_index (array, j);
183 /* move 'xy' code behind all 'xy-ab' codes */
184 for (i = (int) array->len - 2; i >= 0; i--)
186 for (j = (int) array->len - 1; j > i; j--)
188 lang1 = (char *) g_array_index (array, char *, i);
189 lang2 = (char *) g_array_index (array, char *, j);
191 if (strchr (lang1, '-') == NULL &&
192 strchr (lang2, '-') != NULL &&
193 g_str_has_prefix (lang2, lang1))
195 g_array_insert_val (array, j + 1, lang1);
196 g_array_remove_index (array, i);
204 ephy_langs_append_languages (GArray *array)
206 const char * const * languages;
210 languages = g_get_language_names ();
211 g_return_if_fail (languages != NULL);
213 /* FIXME: maybe just use the first, instead of all of them? */
214 for (i = 0; languages[i] != NULL; i++)
217 if (strstr (languages[i], ".") == 0 &&
218 strstr (languages[i], "@") == 0 &&
219 strcmp (languages[i], "C") != 0)
221 /* change to lowercase and '_' to '-' */
222 lang = g_strdelimit (g_ascii_strdown
223 (languages[i], -1), "_", '-');
225 g_array_append_val (array, lang);
229 /* Fallback: add "en" if list is empty */
232 lang = g_strdup ("en");
233 g_array_append_val (array, lang);
238 ephy_langs_get_languages (void)
242 array = g_array_new (TRUE, FALSE, sizeof (char *));
244 ephy_langs_append_languages (array);
246 ephy_langs_sanitise (array);
248 return (char **) g_array_free (array, FALSE);
251 #define ISOCODESLOCALEDIR ISO_CODES_PREFIX "/share/locale"
254 ephy_langs_bind_iso_domains (void)
257 static gboolean bound = FALSE;
261 bindtextdomain (ISO_639_DOMAIN, ISOCODESLOCALEDIR);
262 bind_textdomain_codeset (ISO_639_DOMAIN, "UTF-8");
264 bindtextdomain(ISO_3166_DOMAIN, ISOCODESLOCALEDIR);
265 bind_textdomain_codeset (ISO_3166_DOMAIN, "UTF-8");
273 read_iso_639_entry (xmlTextReaderPtr reader,
276 xmlChar *code, *name;
278 code = xmlTextReaderGetAttribute (reader, (const xmlChar *) "iso_639_1_code");
279 name = xmlTextReaderGetAttribute (reader, (const xmlChar *) "name");
281 /* Get iso-639-2 code */
282 if (code == NULL || code[0] == '\0')
285 /* FIXME: use the 2T or 2B code? */
286 code = xmlTextReaderGetAttribute (reader, (const xmlChar *) "iso_639_2T_code");
289 if (code != NULL && code[0] != '\0' && name != NULL && name[0] != '\0')
291 g_hash_table_insert (table, code, name);
301 read_iso_3166_entry (xmlTextReaderPtr reader,
304 xmlChar *code, *name;
306 code = xmlTextReaderGetAttribute (reader, (const xmlChar *) "alpha_2_code");
307 name = xmlTextReaderGetAttribute (reader, (const xmlChar *) "name");
309 if (code != NULL && code[0] != '\0' && name != NULL && name[0] != '\0')
313 lcode = g_ascii_strdown ((char *) code, -1);
316 g_hash_table_insert (table, lcode, name);
334 load_iso_entries (int iso,
335 GFunc read_entry_func,
338 xmlTextReaderPtr reader;
339 ParserState state = STATE_START;
340 xmlChar iso_entries[32], iso_entry[32];
344 LOG ("Loading ISO-%d codes", iso);
346 START_PROFILER ("Loading ISO codes")
348 filename = g_strdup_printf (ISO_CODES_PREFIX "/share/xml/iso-codes/iso_%d.xml", iso);
349 reader = xmlNewTextReaderFilename (filename);
350 if (reader == NULL) goto out;
352 xmlStrPrintf (iso_entries, sizeof (iso_entries), (const xmlChar *)"iso_%d_entries", iso);
353 xmlStrPrintf (iso_entry, sizeof (iso_entry), (const xmlChar *)"iso_%d_entry", iso);
355 ret = xmlTextReaderRead (reader);
362 tag = xmlTextReaderConstName (reader);
363 type = xmlTextReaderNodeType (reader);
365 if (state == STATE_ENTRIES &&
366 type == XML_READER_TYPE_ELEMENT &&
367 xmlStrEqual (tag, iso_entry))
369 read_entry_func (reader, user_data);
371 else if (state == STATE_START &&
372 type == XML_READER_TYPE_ELEMENT &&
373 xmlStrEqual (tag, iso_entries))
375 state = STATE_ENTRIES;
377 else if (state == STATE_ENTRIES &&
378 type == XML_READER_TYPE_END_ELEMENT &&
379 xmlStrEqual (tag, iso_entries))
383 else if (type == XML_READER_TYPE_SIGNIFICANT_WHITESPACE ||
384 type == XML_READER_TYPE_WHITESPACE ||
385 type == XML_READER_TYPE_TEXT ||
386 type == XML_READER_TYPE_COMMENT)
395 ret = xmlTextReaderRead (reader);
398 xmlFreeTextReader (reader);
401 if (ret < 0 || state != STATE_STOP)
403 g_warning ("Failed to load ISO-%d codes from %s!\n",
409 STOP_PROFILER ("Loading ISO codes")
413 ephy_langs_iso_639_table (void)
417 ephy_langs_bind_iso_domains ();
418 table = g_hash_table_new_full (g_str_hash, g_str_equal,
419 (GDestroyNotify) xmlFree,
420 (GDestroyNotify) xmlFree);
422 load_iso_entries (639, (GFunc) read_iso_639_entry, table);
428 ephy_langs_iso_3166_table (void)
432 ephy_langs_bind_iso_domains ();
433 table = g_hash_table_new_full (g_str_hash, g_str_equal,
434 (GDestroyNotify) g_free,
435 (GDestroyNotify) xmlFree);
437 load_iso_entries (3166, (GFunc) read_iso_3166_entry, table);