diff options
Diffstat (limited to 'app/widgets/gimplanguagestore-parser.c')
-rw-r--r-- | app/widgets/gimplanguagestore-parser.c | 519 |
1 files changed, 519 insertions, 0 deletions
diff --git a/app/widgets/gimplanguagestore-parser.c b/app/widgets/gimplanguagestore-parser.c new file mode 100644 index 0000000..d667a7a --- /dev/null +++ b/app/widgets/gimplanguagestore-parser.c @@ -0,0 +1,519 @@ +/* GIMP - The GNU Image Manipulation Program + * Copyright (C) 1995 Spencer Kimball and Peter Mattis + * + * gimplanguagestore-parser.c + * Copyright (C) 2008, 2009 Sven Neumann <sven@gimp.org> + * Copyright (C) 2013 Jehan <jehan at girinstud.io> + * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 3 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program. If not, see <https://www.gnu.org/licenses/>. + */ + +#include "config.h" + +#include <locale.h> +#include <string.h> + +#include <gtk/gtk.h> + +#include "libgimpbase/gimpbase.h" + +#include "widgets-types.h" + +#include "config/gimpxmlparser.h" + +#include "gimplanguagestore.h" +#include "gimplanguagestore-parser.h" + +#include "gimp-intl.h" + + +typedef enum +{ + ISO_CODES_START, + ISO_CODES_IN_ENTRIES, + ISO_CODES_IN_ENTRY, + ISO_CODES_IN_UNKNOWN +} IsoCodesParserState; + +typedef struct +{ + IsoCodesParserState state; + IsoCodesParserState last_known_state; + gint unknown_depth; + GHashTable *base_lang_list; +} IsoCodesParser; + + +static gboolean parse_iso_codes (GHashTable *base_lang_list, + GError **error); + +#ifdef HAVE_ISO_CODES +static void iso_codes_parser_init (void); +static void iso_codes_parser_start_element (GMarkupParseContext *context, + const gchar *element_name, + const gchar **attribute_names, + const gchar **attribute_values, + gpointer user_data, + GError **error); +static void iso_codes_parser_end_element (GMarkupParseContext *context, + const gchar *element_name, + gpointer user_data, + GError **error); + +static void iso_codes_parser_start_unknown (IsoCodesParser *parser); +static void iso_codes_parser_end_unknown (IsoCodesParser *parser); +#endif /* HAVE_ISO_CODES */ + +/* + * Language lists that we want to generate only once at program startup: + * @l10n_lang_list: all available localizations self-localized; + * @all_lang_list: all known languages, in the user-selected language. + */ +static GHashTable *l10n_lang_list = NULL; +static GHashTable *all_lang_list = NULL; + +/********************\ + * Public Functions * +\********************/ + +/* + * Initialize and run the language listing parser. This call must be + * made only once, at program initialization, but after language_init(). + */ +void +gimp_language_store_parser_init (void) +{ + GHashTable *base_lang_list; + gchar *current_env; + GDir *locales_dir; + GError *error = NULL; + GHashTableIter lang_iter; + gpointer key; + + if (l10n_lang_list != NULL) + { + g_warning ("gimp_language_store_parser_init() must be run only once."); + return; + } + + current_env = g_strdup (g_getenv ("LANGUAGE")); + + l10n_lang_list = g_hash_table_new_full (g_str_hash, g_str_equal, + (GDestroyNotify) g_free, + (GDestroyNotify) g_free); + all_lang_list = g_hash_table_new_full (g_str_hash, g_str_equal, + (GDestroyNotify) g_free, + (GDestroyNotify) g_free); + base_lang_list = g_hash_table_new_full (g_str_hash, g_str_equal, + (GDestroyNotify) g_free, + (GDestroyNotify) g_free); + + /* Check all locales we have translations for. */ + locales_dir = g_dir_open (gimp_locale_directory (), 0, NULL); + if (locales_dir) + { + const gchar *locale; + + while ((locale = g_dir_read_name (locales_dir)) != NULL) + { + gchar *filename = g_build_filename (gimp_locale_directory (), + locale, + "LC_MESSAGES", + GETTEXT_PACKAGE ".mo", + NULL); + if (g_file_test (filename, G_FILE_TEST_EXISTS)) + { + gchar *delimiter = NULL; + gchar *base_code = NULL; + + delimiter = strchr (locale, '_'); + + if (delimiter) + base_code = g_strndup (locale, delimiter - locale); + else + base_code = g_strdup (locale); + + delimiter = strchr (base_code, '@'); + + if (delimiter) + { + gchar *temp = base_code; + base_code = g_strndup (base_code, delimiter - base_code); + g_free (temp); + } + + /* Save the full language code. */ + g_hash_table_insert (l10n_lang_list, g_strdup (locale), NULL); + /* Save the base language code. */ + g_hash_table_insert (base_lang_list, base_code, NULL); + } + + g_free (filename); + } + + g_dir_close (locales_dir); + } + + /* Parse ISO-639 file to get full list of language and their names. */ + parse_iso_codes (base_lang_list, &error); + + /* Generate the localized language names. */ + g_hash_table_iter_init (&lang_iter, l10n_lang_list); + while (g_hash_table_iter_next (&lang_iter, &key, NULL)) + { + gchar *code = (gchar*) key; + gchar *localized_name = NULL; + gchar *english_name = NULL; + gchar *delimiter = NULL; + gchar *base_code = NULL; + + delimiter = strchr (code, '_'); + + if (delimiter) + base_code = g_strndup (code, delimiter - code); + else + base_code = g_strdup (code); + + delimiter = strchr (base_code, '@'); + + if (delimiter) + { + gchar *temp = base_code; + base_code = g_strndup (base_code, delimiter - base_code); + g_free (temp); + } + + english_name = (gchar*) (g_hash_table_lookup (base_lang_list, base_code)); + + if (english_name) + { + gchar *semicolon; + + /* If possible, we want to localize a language in itself. + * If it fails, gettext fallbacks to C (en_US) itself. + */ + g_setenv ("LANGUAGE", code, TRUE); + setlocale (LC_ALL, ""); + + localized_name = g_strdup (dgettext ("iso_639", english_name)); + + /* If original and localized names are the same for other than English, + * maybe localization failed. Try now in the main dialect. */ + if (g_strcmp0 (english_name, localized_name) == 0 && + g_strcmp0 (base_code, "en") != 0 && + g_strcmp0 (code, base_code) != 0) + { + g_free (localized_name); + + g_setenv ("LANGUAGE", base_code, TRUE); + setlocale (LC_ALL, ""); + + localized_name = g_strdup (dgettext ("iso_639", english_name)); + } + + /* there might be several language names; use the first one */ + semicolon = strchr (localized_name, ';'); + + if (semicolon) + { + gchar *temp = localized_name; + localized_name = g_strndup (localized_name, semicolon - localized_name); + g_free (temp); + } + } + + g_hash_table_replace (l10n_lang_list, g_strdup(code), + g_strdup_printf ("%s [%s]", + localized_name ? + localized_name : "???", + code)); + g_free (localized_name); + g_free (base_code); + } + + /* Add special entries for system locale. + * We want the system locale to be localized in itself. */ + g_setenv ("LANGUAGE", setlocale (LC_ALL, NULL), TRUE); + setlocale (LC_ALL, ""); + + /* g_str_hash() does not accept NULL. I give an empty code instead. + * Other solution would to create a custom hash. */ + g_hash_table_insert (l10n_lang_list, g_strdup(""), + g_strdup (_("System Language"))); + + /* Go back to original localization. */ + if (current_env) + { + g_setenv ("LANGUAGE", current_env, TRUE); + g_free (current_env); + } + else + g_unsetenv ("LANGUAGE"); + setlocale (LC_ALL, ""); + + /* Add special entry for C (en_US). */ + g_hash_table_insert (l10n_lang_list, g_strdup ("en_US"), + g_strdup ("English [en_US]")); + + g_hash_table_destroy (base_lang_list); +} + +void +gimp_language_store_parser_clean (void) +{ + g_hash_table_destroy (l10n_lang_list); + g_hash_table_destroy (all_lang_list); +} + +/* + * Returns a Hash table of languages. + * Keys and values are respectively language codes and names from the + * ISO-639 standard code. + * + * If @localization_only is TRUE, it returns only the list of available + * GIMP localizations, and language names are translated in their own + * locale. + * If @localization_only is FALSE, the full list of ISO-639 languages + * is returned, and language names are in the user-set locale. + * + * Do not free the list or elements of the list. + */ +GHashTable * +gimp_language_store_parser_get_languages (gboolean localization_only) +{ + if (localization_only) + return l10n_lang_list; + else + return all_lang_list; +} + +/*****************************\ + * Private Parsing Functions * +\*****************************/ + +/* + * Parse the ISO-639 code list if available on this system, and fill + * @base_lang_list with English names of all needed base codes. + * + * It will also fill the static @all_lang_list. + */ +static gboolean +parse_iso_codes (GHashTable *base_lang_list, + GError **error) +{ + gboolean success = TRUE; + +#ifdef HAVE_ISO_CODES + static const GMarkupParser markup_parser = + { + iso_codes_parser_start_element, + iso_codes_parser_end_element, + NULL, /* characters */ + NULL, /* passthrough */ + NULL /* error */ + }; + + GimpXmlParser *xml_parser; + GFile *file; + IsoCodesParser parser = { 0, }; + + g_return_val_if_fail (error == NULL || *error == NULL, FALSE); + + iso_codes_parser_init (); + + parser.base_lang_list = g_hash_table_ref (base_lang_list); + + xml_parser = gimp_xml_parser_new (&markup_parser, &parser); + +#if ENABLE_RELOCATABLE_RESOURCES + file = gimp_installation_directory_file ("share", "xml", "iso-codes", + "iso_639.xml", NULL); +#else + file = g_file_new_for_path (ISO_CODES_LOCATION G_DIR_SEPARATOR_S + "iso_639.xml"); +#endif + + success = gimp_xml_parser_parse_gfile (xml_parser, file, error); + if (error && *error) + { + g_warning ("%s: error parsing '%s': %s\n", + G_STRFUNC, g_file_get_path (file), + (*error)->message); + g_clear_error (error); + } + + g_object_unref (file); + + gimp_xml_parser_free (xml_parser); + g_hash_table_unref (parser.base_lang_list); + +#endif /* HAVE_ISO_CODES */ + + return success; +} + +#ifdef HAVE_ISO_CODES +static void +iso_codes_parser_init (void) +{ + static gboolean initialized = FALSE; + + if (initialized) + return; + +#ifdef G_OS_WIN32 + /* on Win32, assume iso-codes is installed in the same location as GIMP */ + bindtextdomain ("iso_639", gimp_locale_directory ()); +#else + bindtextdomain ("iso_639", ISO_CODES_LOCALEDIR); +#endif + + bind_textdomain_codeset ("iso_639", "UTF-8"); + + initialized = TRUE; +} + +static void +iso_codes_parser_entry (IsoCodesParser *parser, + const gchar **names, + const gchar **values) +{ + const gchar *lang = NULL; + const gchar *code = NULL; + + while (*names && *values) + { + if (strcmp (*names, "name") == 0) + lang = *values; + else if (strcmp (*names, "iso_639_2B_code") == 0 && code == NULL) + /* 2-letter ISO 639-1 codes have priority. + * But some languages have no 2-letter code. Ex: Asturian (ast). + */ + code = *values; + else if (strcmp (*names, "iso_639_2T_code") == 0 && code == NULL) + code = *values; + else if (strcmp (*names, "iso_639_1_code") == 0) + code = *values; + + names++; + values++; + } + + if (lang && *lang && code && *code) + { + gchar *semicolon; + gchar *localized_name = g_strdup (dgettext ("iso_639", lang)); + + /* If the language is in our base table, we save its standard English name. */ + if (g_hash_table_contains (parser->base_lang_list, code)) + g_hash_table_replace (parser->base_lang_list, g_strdup (code), g_strdup (lang)); + + /* there might be several language names; use the first one */ + semicolon = strchr (localized_name, ';'); + + if (semicolon) + { + gchar *temp = localized_name; + localized_name = g_strndup (localized_name, semicolon - localized_name); + g_free (temp); + } + /* In any case, we save the name in user-set language for all lang. */ + g_hash_table_insert (all_lang_list, g_strdup (code), localized_name); + } +} + +static void +iso_codes_parser_start_element (GMarkupParseContext *context, + const gchar *element_name, + const gchar **attribute_names, + const gchar **attribute_values, + gpointer user_data, + GError **error) +{ + IsoCodesParser *parser = user_data; + + switch (parser->state) + { + case ISO_CODES_START: + if (strcmp (element_name, "iso_639_entries") == 0) + { + parser->state = ISO_CODES_IN_ENTRIES; + break; + } + + case ISO_CODES_IN_ENTRIES: + if (strcmp (element_name, "iso_639_entry") == 0) + { + parser->state = ISO_CODES_IN_ENTRY; + iso_codes_parser_entry (parser, attribute_names, attribute_values); + break; + } + + case ISO_CODES_IN_ENTRY: + case ISO_CODES_IN_UNKNOWN: + iso_codes_parser_start_unknown (parser); + break; + } +} + +static void +iso_codes_parser_end_element (GMarkupParseContext *context, + const gchar *element_name, + gpointer user_data, + GError **error) +{ + IsoCodesParser *parser = user_data; + + switch (parser->state) + { + case ISO_CODES_START: + g_warning ("%s: shouldn't get here", G_STRLOC); + break; + + case ISO_CODES_IN_ENTRIES: + parser->state = ISO_CODES_START; + break; + + case ISO_CODES_IN_ENTRY: + parser->state = ISO_CODES_IN_ENTRIES; + break; + + case ISO_CODES_IN_UNKNOWN: + iso_codes_parser_end_unknown (parser); + break; + } +} + +static void +iso_codes_parser_start_unknown (IsoCodesParser *parser) +{ + if (parser->unknown_depth == 0) + parser->last_known_state = parser->state; + + parser->state = ISO_CODES_IN_UNKNOWN; + parser->unknown_depth++; +} + +static void +iso_codes_parser_end_unknown (IsoCodesParser *parser) +{ + gimp_assert (parser->unknown_depth > 0 && + parser->state == ISO_CODES_IN_UNKNOWN); + + parser->unknown_depth--; + + if (parser->unknown_depth == 0) + parser->state = parser->last_known_state; +} +#endif /* HAVE_ISO_CODES */ |