/* -*- Mode: C; tab-width: 8; indent-tabs-mode: t; c-basic-offset: 8 -*- */
/*
* Copyright (C) 2004-2007 Imendio AB
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License as
* published by the Free Software Foundation; either version 2 of the
* License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* General Public License for more details.
*
* You should have received a copy of the GNU General Public
* License along with this program; if not, write to the
* Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
* Boston, MA 02110-1301 USA
*
* Authors: Martyn Russell <martyn@imendio.com>
* Richard Hult <richard@imendio.com>
*/
#include "config.h"
#include <string.h>
#include <stdlib.h>
#include <glib/gi18n-lib.h>
#ifdef HAVE_ENCHANT
#include <enchant.h>
#endif
#include "empathy-spell.h"
#define DEBUG_FLAG EMPATHY_DEBUG_OTHER
#include <libempathy/empathy-debug.h>
#include <libempathy/empathy-gsettings.h>
#ifdef HAVE_ENCHANT
typedef struct {
EnchantBroker *config;
EnchantDict *speller;
} SpellLanguage;
#define ISO_CODES_DATADIR ISO_CODES_PREFIX "/share/xml/iso-codes"
#define ISO_CODES_LOCALESDIR ISO_CODES_PREFIX "/share/locale"
/* Language code (gchar *) -> language name (gchar *) */
static GHashTable *iso_code_names = NULL;
/* Contains only _enabled_ languages
* Language code (gchar *) -> language (SpellLanguage *) */
static GHashTable *languages = NULL;
static void
spell_iso_codes_parse_start_tag (GMarkupParseContext *ctx,
const gchar *element_name,
const gchar **attr_names,
const gchar **attr_values,
gpointer data,
GError **error)
{
const gchar *ccode_longB, *ccode_longT, *ccode;
const gchar *lang_name;
if (!g_str_equal (element_name, "iso_639_entry") ||
attr_names == NULL || attr_values == NULL) {
return;
}
ccode = NULL;
ccode_longB = NULL;
ccode_longT = NULL;
lang_name = NULL;
while (*attr_names && *attr_values) {
if (g_str_equal (*attr_names, "iso_639_1_code")) {
if (**attr_values) {
ccode = *attr_values;
}
}
else if (g_str_equal (*attr_names, "iso_639_2B_code")) {
if (**attr_values) {
ccode_longB = *attr_values;
}
}
else if (g_str_equal (*attr_names, "iso_639_2T_code")) {
if (**attr_values) {
ccode_longT = *attr_values;
}
}
else if (g_str_equal (*attr_names, "name")) {
lang_name = *attr_values;
}
attr_names++;
attr_values++;
}
if (!lang_name) {
return;
}
if (ccode) {
g_hash_table_insert (iso_code_names,
g_strdup (ccode),
g_strdup (lang_name));
}
if (ccode_longB) {
g_hash_table_insert (iso_code_names,
g_strdup (ccode_longB),
g_strdup (lang_name));
}
if (ccode_longT) {
g_hash_table_insert (iso_code_names,
g_strdup (ccode_longT),
g_strdup (lang_name));
}
}
static void
spell_iso_code_names_init (void)
{
GError *err = NULL;
gchar *buf;
gsize buf_len;
iso_code_names = g_hash_table_new_full (g_str_hash, g_str_equal,
g_free, g_free);
bindtextdomain ("iso_639", ISO_CODES_LOCALESDIR);
bind_textdomain_codeset ("iso_639", "UTF-8");
/* FIXME: We should read this in chunks and pass to the parser. */
if (g_file_get_contents (ISO_CODES_DATADIR "/iso_639.xml", &buf, &buf_len, &err)) {
GMarkupParseContext *ctx;
GMarkupParser parser = {
spell_iso_codes_parse_start_tag,
NULL, NULL, NULL, NULL
};
ctx = g_markup_parse_context_new (&parser, 0, NULL, NULL);
if (!g_markup_parse_context_parse (ctx, buf, buf_len, &err)) {
g_warning ("Failed to parse '%s': %s",
ISO_CODES_DATADIR"/iso_639.xml",
err->message);
g_error_free (err);
}
g_markup_parse_context_free (ctx);
g_free (buf);
} else {
g_warning ("Failed to load '%s': %s",
ISO_CODES_DATADIR"/iso_639.xml", err->message);
g_error_free (err);
}
}
static void
spell_notify_languages_cb (GSettings *gsettings,
const gchar *key,
gpointer user_data)
{
DEBUG ("Resetting languages due to config change");
/* We just reset the languages list. */
if (languages != NULL) {
g_hash_table_destroy (languages);
languages = NULL;
}
}
static void
empathy_spell_free_language (SpellLanguage *lang)
{
enchant_broker_free_dict (lang->config, lang->speller);
enchant_broker_free (lang->config);
g_slice_free (SpellLanguage, lang);
}
static void
spell_setup_languages (void)
{
static GSettings *gsettings = NULL;
gchar *str;
if (gsettings == NULL) {
/* FIXME: this is never uninitialised */
gsettings = g_settings_new (EMPATHY_PREFS_CHAT_SCHEMA);
g_signal_connect (gsettings,
"changed::" EMPATHY_PREFS_CHAT_SPELL_CHECKER_LANGUAGES,
G_CALLBACK (spell_notify_languages_cb), NULL);
}
if (languages) {
return;
}
languages = g_hash_table_new_full (g_str_hash, g_str_equal,
g_free, (GDestroyNotify) empathy_spell_free_language);
str = g_settings_get_string (gsettings,
EMPATHY_PREFS_CHAT_SPELL_CHECKER_LANGUAGES);
if (str != NULL) {
gchar **strv;
gint i;
strv = g_strsplit (str, ",", -1);
i = 0;
while (strv && strv[i]) {
SpellLanguage *lang;
DEBUG ("Setting up language:'%s'", strv[i]);
lang = g_slice_new0 (SpellLanguage);
lang->config = enchant_broker_init ();
lang->speller = enchant_broker_request_dict (lang->config, strv[i]);
if (lang->speller == NULL) {
DEBUG ("language '%s' has no valid dict", strv[i]);
} else {
g_hash_table_insert (languages,
g_strdup (strv[i]),
lang);
}
i++;
}
if (strv) {
g_strfreev (strv);
}
g_free (str);
}
}
const gchar *
empathy_spell_get_language_name (const gchar *code)
{
const gchar *name;
g_return_val_if_fail (code != NULL, NULL);
if (!iso_code_names) {
spell_iso_code_names_init ();
}
name = g_hash_table_lookup (iso_code_names, code);
if (!name) {
return NULL;
}
return dgettext ("iso_639", name);
}
static void
enumerate_dicts (const gchar * const lang_tag,
const gchar * const provider_name,
const gchar * const provider_desc,
const gchar * const provider_file,
gpointer user_data)
{
GList **list = user_data;
gchar *lang = g_strdup (lang_tag);
if (strchr (lang, '_')) {
/* cut country part out of language */
strchr (lang, '_')[0] = '\0';
}
if (g_list_find_custom (*list, lang, (GCompareFunc) strcmp)) {
/* this language is already part of the list */
g_free (lang);
return;
}
*list = g_list_append (*list, g_strdup (lang));
}
GList *
empathy_spell_get_language_codes (void)
{
EnchantBroker *broker;
GList *list_langs = NULL;
broker = enchant_broker_init ();
enchant_broker_list_dicts (broker, enumerate_dicts, &list_langs);
enchant_broker_free (broker);
return list_langs;
}
GList *
empathy_spell_get_enabled_language_codes (void)
{
spell_setup_languages ();
return g_hash_table_get_keys (languages);
}
void
empathy_spell_free_language_codes (GList *codes)
{
g_list_foreach (codes, (GFunc) g_free, NULL);
g_list_free (codes);
}
gboolean
empathy_spell_check (const gchar *word)
{
gint enchant_result = 1;
const gchar *p;
gboolean digit;
gunichar c;
gint len;
GHashTableIter iter;
SpellLanguage *lang;
g_return_val_if_fail (word != NULL, FALSE);
spell_setup_languages ();
if (!languages) {
return TRUE;
}
/* Ignore certain cases like numbers, etc. */
for (p = word, digit = TRUE; *p && digit; p = g_utf8_next_char (p)) {
c = g_utf8_get_char (p);
digit = g_unichar_isdigit (c);
}
if (digit) {
/* We don't spell check digits. */
DEBUG ("Not spell checking word:'%s', it is all digits", word);
return TRUE;
}
len = strlen (word);
g_hash_table_iter_init (&iter, languages);
while (g_hash_table_iter_next (&iter, NULL, (gpointer *) &lang)) {
enchant_result = enchant_dict_check (lang->speller, word, len);
if (enchant_result == 0) {
break;
}
}
return (enchant_result == 0);
}
GList *
empathy_spell_get_suggestions (const gchar *code,
const gchar *word)
{
gint len;
GList *suggestion_list = NULL;
SpellLanguage *lang;
gchar **suggestions;
gsize i, number_of_suggestions;
g_return_val_if_fail (code != NULL, NULL);
g_return_val_if_fail (word != NULL, NULL);
spell_setup_languages ();
if (!languages) {
return NULL;
}
len = strlen (word);
lang = g_hash_table_lookup (languages, code);
if (!lang) {
return NULL;
}
suggestions = enchant_dict_suggest (lang->speller, word, len,
&number_of_suggestions);
for (i = 0; i < number_of_suggestions; i++) {
suggestion_list = g_list_append (suggestion_list,
g_strdup (suggestions[i]));
}
if (suggestions) {
enchant_dict_free_string_list (lang->speller, suggestions);
}
return suggestion_list;
}
gboolean
empathy_spell_supported (void)
{
if (g_getenv ("EMPATHY_SPELL_DISABLED")) {
DEBUG ("EMPATHY_SPELL_DISABLE env variable defined");
return FALSE;
}
return TRUE;
}
void
empathy_spell_add_to_dictionary (const gchar *code,
const gchar *word)
{
SpellLanguage *lang;
g_return_if_fail (code != NULL);
g_return_if_fail (word != NULL);
spell_setup_languages ();
if (languages == NULL)
return;
lang = g_hash_table_lookup (languages, code);
if (lang == NULL)
return;
enchant_dict_add_to_pwl (lang->speller, word, strlen (word));
}
#else /* not HAVE_ENCHANT */
gboolean
empathy_spell_supported (void)
{
return FALSE;
}
GList *
empathy_spell_get_suggestions (const gchar *word)
{
DEBUG ("Support disabled, could not get suggestions");
return NULL;
}
gboolean
empathy_spell_check (const gchar *word)
{
DEBUG ("Support disabled, could not check spelling");
return TRUE;
}
const gchar *
empathy_spell_get_language_name (const gchar *lang)
{
DEBUG ("Support disabled, could not get language name");
return NULL;
}
GList *
empathy_spell_get_language_codes (void)
{
DEBUG ("Support disabled, could not get language codes");
return NULL;
}
void
empathy_spell_free_language_codes (GList *codes)
{
}
void
empathy_spell_add_to_dictionary (const gchar *code,
const gchar *word)
{
DEBUG ("Support disabled, could not expand the dictionary");
}
#endif /* HAVE_ENCHANT */
void
empathy_spell_free_suggestions (GList *suggestions)
{
g_list_foreach (suggestions, (GFunc) g_free, NULL);
g_list_free (suggestions);
}