aboutsummaryrefslogblamecommitdiffstats
path: root/lib/ephy-langs.c
blob: 793f179ce26be8d5c3dcdcb063e04d867ba1848c (plain) (tree)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16















                                                                              

        
   
 
                   
 
                       
 

                       
                       
 

                   



                             
                                                      
 












                                                                           
                                                                  


                                                                      


                                                                    

                             
 
                              

 

                            
 
                                
 






































                                                                              
                                                  
         
                                                          












                                                                          
                                                   
         
                                                          













































































                                                                                         





































































































































































































                                                                                               
/*
 *  Copyright (C) 2003 Christian Persch
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; either version 2, or (at your option)
 *  any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, write to the Free Software
 *  Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
 *
 *  $Id$
 */

#include "config.h"

#include "ephy-langs.h"

#include "ephy-debug.h"

#include <glib/gi18n.h>

#include <string.h>

#ifdef HAVE_ISO_CODES
#include <libxml/xmlreader.h>
#endif

static const EphyFontsLanguageInfo font_languages [] =
{
    { N_("Arabic"),                 "ar" },
    { N_("Baltic"),                 "x-baltic" },
    { N_("Central European"),           "x-central-euro" },
    { N_("Cyrillic"),               "x-cyrillic" },
    { N_("Devanagari"),             "x-devanagari" },
    { N_("Greek"),                  "el" },
    { N_("Hebrew"),                 "he" },
    { N_("Japanese"),               "ja" },
    { N_("Korean"),                 "ko" },
    { N_("Simplified Chinese"),         "zh-CN" },
    { N_("Tamil"),                  "x-tamil" },
    { N_("Thai"),                   "th" },
    { N_("Traditional Chinese"),            "zh-TW" },
    { N_("Traditional Chinese (Hong Kong)"),    "zh-HK" },
    { N_("Turkish"),                "tr" },
    { N_("Unicode"),                "x-unicode" },
    { N_("Western"),                "x-western" }
};
static const guint n_font_languages = G_N_ELEMENTS (font_languages);

const EphyFontsLanguageInfo *
ephy_font_languages (void)
{
    return font_languages;
}

guint            
ephy_font_n_languages (void)
{
    return n_font_languages;
}

/* sanitise the languages list according to the rules for HTTP accept-language
 * in RFC 2616, Sect. 14.4
 */
void
ephy_langs_sanitise (GArray *array)
{
    char *lang1, *lang2;
    int i, j;

    /* if we have 'xy-ab' in list but not 'xy', append 'xy' */
    for (i = 0; i < array->len; i++)
    {
        gboolean found = FALSE;
        char *dash, *prefix;

        lang1 = (char *) g_array_index (array,char *, i);

        dash = strchr (lang1, '-');
        if (dash == NULL) continue;

        for (j = i + 1; j < array->len; j++)
        {
            lang2 = (char *) g_array_index (array, char *, j);
            if (strchr (lang2, '-') == NULL &&
                g_str_has_prefix (lang1, lang2))
            {
                found = TRUE;
            }
        }

        if (found == FALSE)
        {
            prefix = g_strndup (lang1, dash - lang1);
            g_array_append_val (array, prefix);
        }
    }

    /* uniquify */
    for (i = 0; i < (int) array->len - 1; i++)
    {
        for (j = (int) array->len - 1; j > i; j--)
        {
            lang1 = (char *) g_array_index (array,char *, i);
            lang2 = (char *) g_array_index (array, char *, j);

            if (strcmp (lang1, lang2) == 0)
            {
                g_array_remove_index (array, j);
                g_free (lang2);
            }
        }
    }

    /* move 'xy' code behind all 'xy-ab' codes */
    for (i = (int) array->len - 2; i >= 0; i--)
    {
        for (j = (int) array->len - 1; j > i; j--)
        {
            lang1 = (char *) g_array_index (array, char *, i);
            lang2 = (char *) g_array_index (array, char *, j);

            if (strchr (lang1, '-') == NULL &&
                strchr (lang2, '-') != NULL &&
                g_str_has_prefix (lang2, lang1))
            {
                g_array_insert_val (array, j + 1, lang1);
                g_array_remove_index (array, i);
                break;
            }
        }
    }
}

void
ephy_langs_append_languages (GArray *array)
{
    const char * const * languages;
    const char *system_lang;
    char *lang;
    int i;

    /**
    * This is a comma separated list of language ranges, as specified
    * by RFC 2616, 14.4.
    * Always include the basic language code last.
    *
    * Examples:
    * "pt"    translation: "pt"
    * "pt_BR" translation: "pt-br,pt"
    * "zh_CN" translation: "zh-cn,zh"
    * "zh_HK" translation: "zh-hk,zh" or maybe "zh-hk,zh-tw,zh"
    */
    system_lang = _("system-language");

    /* FIXME: use system_language when given, instead of g_get_language_names () ? */
    languages = g_get_language_names ();
    g_return_if_fail (languages != NULL);

    /* FIXME: maybe just use the first, instead of all of them? */
    for (i = 0; languages[i] != NULL; i++)
    {

        if (strstr (languages[i], ".") == 0 &&
            strstr (languages[i], "@") == 0 &&
            strcmp (languages[i], "C") != 0)
        {
            /* change to lowercase and '_' to '-' */
            lang = g_strdelimit (g_ascii_strdown
                        (languages[i], -1), "_", '-');

            g_array_append_val (array, lang);
        }
    }

    /* Fallback: add "en" if list is empty */
    if (array->len == 0)
    {
        lang = g_strdup ("en");
        g_array_append_val (array, lang);
    }
}

char **
ephy_langs_get_languages (void)
{
    GArray *array;

    array = g_array_new (TRUE, FALSE, sizeof (char *));

    ephy_langs_append_languages (array);

    ephy_langs_sanitise (array);

    return (char **) g_array_free (array, FALSE);
}

#ifdef HAVE_ISO_CODES

#define ISOCODESLOCALEDIR   ISO_CODES_PREFIX "/share/locale"

static void
ephy_langs_bind_iso_domains (void)
{
#ifdef ENABLE_NLS
    static gboolean bound = FALSE;

    if (bound == FALSE)
    {
            bindtextdomain (ISO_639_DOMAIN, ISOCODESLOCALEDIR);
            bind_textdomain_codeset (ISO_639_DOMAIN, "UTF-8");

            bindtextdomain(ISO_3166_DOMAIN, ISOCODESLOCALEDIR);
            bind_textdomain_codeset (ISO_3166_DOMAIN, "UTF-8");

        bound = TRUE;
    }
#endif
}

static void
read_iso_639_entry (xmlTextReaderPtr reader,
            GHashTable *table)
{
    xmlChar *code, *name;

    code = xmlTextReaderGetAttribute (reader, (const xmlChar *) "iso_639_1_code");
    name = xmlTextReaderGetAttribute (reader, (const xmlChar *) "name");

    /* Get iso-639-2 code */
    if (code == NULL || code[0] == '\0')
    {
        xmlFree (code);
        /* FIXME: use the 2T or 2B code? */
        code = xmlTextReaderGetAttribute (reader, (const xmlChar *) "iso_639_2T_code");
    }

    if (code != NULL && code[0] != '\0' && name != NULL && name[0] != '\0')
    {
        g_hash_table_insert (table, code, name);
    }
    else
    {
        xmlFree (code);
        xmlFree (name);
    }
}

static void
read_iso_3166_entry (xmlTextReaderPtr reader,
             GHashTable *table)
{
    xmlChar *code, *name;

    code = xmlTextReaderGetAttribute (reader, (const xmlChar *) "alpha_2_code");
    name = xmlTextReaderGetAttribute (reader, (const xmlChar *) "name");

    if (code != NULL && code[0] != '\0' && name != NULL && name[0] != '\0')
    {
        char *lcode;

        lcode = g_ascii_strdown ((char *) code, -1);
        xmlFree (code);

        g_hash_table_insert (table, lcode, name);
    }
    else
    {
        xmlFree (code);
        xmlFree (name);
    }

}

typedef enum
{
    STATE_START,
    STATE_STOP,
    STATE_ENTRIES,
} ParserState;

static gboolean
load_iso_entries (int iso,
          GFunc read_entry_func,
          gpointer user_data)
{
    xmlTextReaderPtr reader;
    ParserState state = STATE_START;
    xmlChar iso_entries[32], iso_entry[32];
    char *filename;
    int ret = -1;

    LOG ("Loading ISO-%d codes", iso)

    START_PROFILER ("Loading ISO codes")

    filename = g_strdup_printf (ISO_CODES_PREFIX "/share/xml/iso-codes/iso_%d.xml", iso);
    reader = xmlNewTextReaderFilename (filename);
    if (reader == NULL) goto out;

    xmlStrPrintf (iso_entries, sizeof (iso_entries), "iso_%d_entries", iso);
    xmlStrPrintf (iso_entry, sizeof (iso_entry), "iso_%d_entry", iso);

    ret = xmlTextReaderRead (reader);

    while (ret == 1)
    {
        const xmlChar *tag;
        xmlReaderTypes type;

        tag = xmlTextReaderConstName (reader);
        type = xmlTextReaderNodeType (reader);

        if (state == STATE_ENTRIES &&
            type == XML_READER_TYPE_ELEMENT &&
            xmlStrEqual (tag, iso_entry))
        {
            read_entry_func (reader, user_data);
        }
        else if (state == STATE_START &&
             type == XML_READER_TYPE_ELEMENT &&
             xmlStrEqual (tag, iso_entries))
        {
            state = STATE_ENTRIES;
        }
        else if (state == STATE_ENTRIES &&
             type == XML_READER_TYPE_END_ELEMENT &&
             xmlStrEqual (tag, iso_entries))
        {
            state = STATE_STOP;
        }
        else if (type == XML_READER_TYPE_SIGNIFICANT_WHITESPACE ||
             type == XML_READER_TYPE_WHITESPACE ||
             type == XML_READER_TYPE_TEXT ||
             type == XML_READER_TYPE_COMMENT)
        {
            /* eat it */
        }
        else
        {
            /* ignore it */
        }

        ret = xmlTextReaderRead (reader);
    }

    xmlFreeTextReader (reader);

out:
    if (ret < 0 || state != STATE_STOP)
    {
        g_warning ("Failed to load ISO-%d codes from %s!\n",
               iso, filename);
        return FALSE;
    }

    g_free (filename);

    STOP_PROFILER ("Loading ISO codes")

    return TRUE;
}

GHashTable *
ephy_langs_iso_639_table (void)
{
    GHashTable *table;

    ephy_langs_bind_iso_domains ();
    table = g_hash_table_new_full (g_str_hash, g_str_equal,
                       (GDestroyNotify) xmlFree,
                       (GDestroyNotify) xmlFree);

    load_iso_entries (639, (GFunc) read_iso_639_entry, table);

    return table;
}

GHashTable *
ephy_langs_iso_3166_table (void)
{
    GHashTable *table;

    ephy_langs_bind_iso_domains ();
    table = g_hash_table_new_full (g_str_hash, g_str_equal,
                       (GDestroyNotify) g_free,
                       (GDestroyNotify) xmlFree);
    
    load_iso_entries (3166, (GFunc) read_iso_3166_entry, table);

    return table;
}

#endif /* HAVE_ISO_CODES */