/* -*- Mode: C; tab-width: 8; indent-tabs-mode: t; c-basic-offset: 8 -*- */
/*
 *  Copyright © 2003 Marco Pesenti Gritti
 *  Copyright © 2003 Christian Persch
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; either version 2, or (at your option)
 *  any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, write to the Free Software
 *  Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 *
 */

#include "config.h"
#include "ephy-encodings.h"

#include "ephy-debug.h"
#include "ephy-prefs.h"
#include "ephy-settings.h"

#include <glib/gi18n.h>
#include <string.h>

/* Fetches the private data area of an EphyEncodings instance. */
#define EPHY_ENCODINGS_GET_PRIVATE(object)(G_TYPE_INSTANCE_GET_PRIVATE ((object), EPHY_TYPE_ENCODINGS, EphyEncodingsPrivate))

/* Per-instance private state of EphyEncodings. */
struct _EphyEncodingsPrivate
{
	/* Maps an encoding code string (owned copy) to its EphyEncoding
	 * object; the table frees the keys and unrefs the values.
	 */
	GHashTable *hash;
	/* Owned copies of recently used encoding codes; new entries are
	 * prepended and the list is capped at RECENT_MAX elements.
	 */
	GSList *recent;
};

/*
 * Translatable encoding titles.
 *
 * Each entry gives the menu title (marked for translation with N_() and
 * translated with _() when the table is loaded in ephy_encodings_init()),
 * the encoding code used as the lookup key, and the language groups the
 * encoding belongs to. Underscores in the titles are stripped by
 * elide_underscores() when the plain title is derived.
 *
 * The string members are pointers to string literals and are therefore
 * declared const.
 *
 * NOTE: if you add/remove/change encodings, please also update the schema in
 * epiphany.schemas.in
 */
static const
struct
{
	const char *title;
	const char *code;
	EphyLanguageGroup groups;
}
encoding_entries [] =
{
	{ N_("Arabic (_IBM-864)"),                  "IBM864",                LG_ARABIC },
	{ N_("Arabic (ISO-_8859-6)"),               "ISO-8859-6",            LG_ARABIC },
	{ N_("Arabic (_MacArabic)"),                "x-mac-arabic",          LG_ARABIC },
	{ N_("Arabic (_Windows-1256)"),             "windows-1256",          LG_ARABIC },
	{ N_("Baltic (_ISO-8859-13)"),              "ISO-8859-13",           LG_BALTIC },
	{ N_("Baltic (I_SO-8859-4)"),               "ISO-8859-4",            LG_BALTIC },
	{ N_("Baltic (_Windows-1257)"),             "windows-1257",          LG_BALTIC },
	{ N_("_Armenian (ARMSCII-8)"),              "armscii-8",             LG_CAUCASIAN },
	{ N_("_Georgian (GEOSTD8)"),                "geostd8",               LG_CAUCASIAN },
	{ N_("Central European (_IBM-852)"),        "IBM852",                LG_C_EUROPEAN },
	{ N_("Central European (I_SO-8859-2)"),     "ISO-8859-2",            LG_C_EUROPEAN },
	{ N_("Central European (_MacCE)"),          "x-mac-ce",              LG_C_EUROPEAN },
	{ N_("Central European (_Windows-1250)"),   "windows-1250",          LG_C_EUROPEAN },
	{ N_("Chinese Simplified (_GB18030)"),      "gb18030",               LG_CHINESE_SIMP },
	{ N_("Chinese Simplified (G_B2312)"),       "GB2312",                LG_CHINESE_SIMP },
	{ N_("Chinese Simplified (GB_K)"),          "x-gbk",                 LG_CHINESE_SIMP },
	{ N_("Chinese Simplified (_HZ)"),           "HZ-GB-2312",            LG_CHINESE_SIMP },
	{ N_("Chinese Simplified (_ISO-2022-CN)"),  "ISO-2022-CN",           LG_CHINESE_SIMP },
	{ N_("Chinese Traditional (Big_5)"),        "Big5",                  LG_CHINESE_TRAD },
	{ N_("Chinese Traditional (Big5-HK_SCS)"),  "Big5-HKSCS",            LG_CHINESE_TRAD },
	{ N_("Chinese Traditional (_EUC-TW)"),      "x-euc-tw",              LG_CHINESE_TRAD },
	{ N_("Cyrillic (_IBM-855)"),                "IBM855",                LG_CYRILLIC },
	{ N_("Cyrillic (I_SO-8859-5)"),             "ISO-8859-5",            LG_CYRILLIC },
	{ N_("Cyrillic (IS_O-IR-111)"),             "ISO-IR-111",            LG_CYRILLIC },
	{ N_("Cyrillic (_KOI8-R)"),                 "KOI8-R",                LG_CYRILLIC },
	{ N_("Cyrillic (_MacCyrillic)"),            "x-mac-cyrillic",        LG_CYRILLIC },
	{ N_("Cyrillic (_Windows-1251)"),           "windows-1251",          LG_CYRILLIC },
	{ N_("Cyrillic/_Russian (IBM-866)"),        "IBM866",                LG_CYRILLIC },
	{ N_("Greek (_ISO-8859-7)"),                "ISO-8859-7",            LG_GREEK },
	{ N_("Greek (_MacGreek)"),                  "x-mac-greek",           LG_GREEK },
	{ N_("Greek (_Windows-1253)"),              "windows-1253",          LG_GREEK },
	{ N_("Gujarati (_MacGujarati)"),            "x-mac-gujarati",        LG_INDIAN },
	{ N_("Gurmukhi (Mac_Gurmukhi)"),            "x-mac-gurmukhi",        LG_INDIAN },
	{ N_("Hindi (Mac_Devanagari)"),             "x-mac-devanagari",      LG_INDIAN },
	{ N_("Hebrew (_IBM-862)"),                  "IBM862",                LG_HEBREW },
	{ N_("Hebrew (IS_O-8859-8-I)"),             "ISO-8859-8-I",          LG_HEBREW },
	{ N_("Hebrew (_MacHebrew)"),                "x-mac-hebrew",          LG_HEBREW },
	{ N_("Hebrew (_Windows-1255)"),             "windows-1255",          LG_HEBREW },
	{ N_("_Visual Hebrew (ISO-8859-8)"),        "ISO-8859-8",            LG_HEBREW },
	{ N_("Japanese (_EUC-JP)"),                 "EUC-JP",                LG_JAPANESE },
	{ N_("Japanese (_ISO-2022-JP)"),            "ISO-2022-JP",           LG_JAPANESE },
	{ N_("Japanese (_Shift-JIS)"),              "Shift_JIS",             LG_JAPANESE },
	{ N_("Korean (_EUC-KR)"),                   "EUC-KR",                LG_KOREAN },
	{ N_("Korean (_ISO-2022-KR)"),              "ISO-2022-KR",           LG_KOREAN },
	{ N_("Korean (_JOHAB)"),                    "x-johab",               LG_KOREAN },
	{ N_("Korean (_UHC)"),                      "x-windows-949",         LG_KOREAN },
	{ N_("_Celtic (ISO-8859-14)"),              "ISO-8859-14",           LG_NORDIC },
	{ N_("_Icelandic (MacIcelandic)"),          "x-mac-icelandic",       LG_NORDIC },
	{ N_("_Nordic (ISO-8859-10)"),              "ISO-8859-10",           LG_NORDIC },
	{ N_("_Persian (MacFarsi)"),                "x-mac-farsi",           LG_PERSIAN },
	{ N_("Croatian (Mac_Croatian)"),            "x-mac-croatian",        LG_SE_EUROPEAN },
	{ N_("_Romanian (MacRomanian)"),            "x-mac-romanian",        LG_SE_EUROPEAN },
	{ N_("R_omanian (ISO-8859-16)"),            "ISO-8859-16",           LG_SE_EUROPEAN },
	{ N_("South _European (ISO-8859-3)"),       "ISO-8859-3",            LG_SE_EUROPEAN },
	{ N_("Thai (TIS-_620)"),                    "TIS-620",               LG_THAI },
	{ N_("Thai (IS_O-8859-11)"),                "iso-8859-11",           LG_THAI },
	{ N_("_Thai (Windows-874)"),                "windows-874",           LG_THAI },
	{ N_("Turkish (_IBM-857)"),                 "IBM857",                LG_TURKISH },
	{ N_("Turkish (I_SO-8859-9)"),              "ISO-8859-9",            LG_TURKISH },
	{ N_("Turkish (_MacTurkish)"),              "x-mac-turkish",         LG_TURKISH },
	{ N_("Turkish (_Windows-1254)"),            "windows-1254",          LG_TURKISH },
	{ N_("Unicode (UTF-_8)"),                   "UTF-8",                 LG_UNICODE },
	{ N_("Cyrillic/Ukrainian (_KOI8-U)"),       "KOI8-U",                LG_UKRAINIAN },
	{ N_("Cyrillic/Ukrainian (Mac_Ukrainian)"), "x-mac-ukrainian",       LG_UKRAINIAN },
	{ N_("Vietnamese (_TCVN)"),                 "x-viet-tcvn5712",       LG_VIETNAMESE },
	{ N_("Vietnamese (_VISCII)"),               "VISCII",                LG_VIETNAMESE },
	{ N_("Vietnamese (V_PS)"),                  "x-viet-vps",            LG_VIETNAMESE },
	{ N_("Vietnamese (_Windows-1258)"),         "windows-1258",          LG_VIETNAMESE },
	{ N_("Western (_IBM-850)"),                 "IBM850",                LG_WESTERN },
	{ N_("Western (_ISO-8859-1)"),              "ISO-8859-1",            LG_WESTERN },
	{ N_("Western (IS_O-8859-15)"),             "ISO-8859-15",           LG_WESTERN },
	{ N_("Western (_MacRoman)"),                "x-mac-roman",           LG_WESTERN },
	{ N_("Western (_Windows-1252)"),            "windows-1252",          LG_WESTERN },

	/* the following encodings are so rarely used that we don't want to pollute the "related"
	 * part of the encodings menu with them, so we set the language group to 0 here
	 */
	{ N_("English (_US-ASCII)"),                "us-ascii",              0 },
	{ N_("Unicode (UTF-_16 BE)"),               "UTF-16BE",              0 },
	{ N_("Unicode (UTF-1_6 LE)"),               "UTF-16LE",              0 },
	{ N_("Unicode (UTF-_32 BE)"),               "UTF-32BE",              0 },
	{ N_("Unicode (UTF-3_2 LE)"),               "UTF-32LE",              0 },
};

/* Upper bound on the number of entries kept in the recently-used list. */
#define RECENT_MAX	4

/* Registers EphyEncodings as a GObject-derived type. */
G_DEFINE_TYPE (EphyEncodings, ephy_encodings, G_TYPE_OBJECT)

/*
 * GObject finalize handler: releases the encodings table and the list of
 * recently used codes, then chains up to the parent class.
 */
static void
ephy_encodings_finalize (GObject *object)
{
	EphyEncodings *self = EPHY_ENCODINGS (object);
	GSList *node;

	g_hash_table_destroy (self->priv->hash);

	/* The recent list owns its strings: free each one, then the cells. */
	for (node = self->priv->recent; node != NULL; node = node->next)
	{
		g_free (node->data);
	}
	g_slist_free (self->priv->recent);

	LOG ("EphyEncodings finalised");

	G_OBJECT_CLASS (ephy_encodings_parent_class)->finalize (object);
}

/*
 * Class initialiser: installs the finalize handler, registers the
 * "encoding-added" signal and reserves room for the private instance data.
 */
static void
ephy_encodings_class_init (EphyEncodingsClass *klass)
{
	GObjectClass *gobject_class;

	gobject_class = G_OBJECT_CLASS (klass);
	gobject_class->finalize = ephy_encodings_finalize;

	/**
	 * EphyEncodings::encoding-added:
	 *
	 * The ::encoding-added signal is emitted when @encodings receives a new encoding.
	 **/
	g_signal_new ("encoding-added",
		      G_OBJECT_CLASS_TYPE (gobject_class),
		      G_SIGNAL_RUN_LAST,
		      0,		/* class_offset: no default handler */
		      NULL, NULL,	/* no accumulator */
		      g_cclosure_marshal_VOID__OBJECT,
		      G_TYPE_NONE,
		      1, G_TYPE_OBJECT);

	g_type_class_add_private (gobject_class, sizeof (EphyEncodingsPrivate));
}

/*
 * Returns a newly allocated copy of @original with underscores removed.
 * An underscore is dropped unless it directly follows a dropped underscore,
 * so "__" yields a single literal '_'. The caller frees the result with
 * g_free().
 *
 * copied from egg-toolbar-editor.c
 */
static char *
elide_underscores (const char *original)
{
	gboolean skipped_underscore = FALSE;
	const char *in;
	char *stripped;
	char *out;

	/* The result can never be longer than the input. */
	stripped = g_malloc (strlen (original) + 1);
	out = stripped;

	for (in = original; *in != '\0'; in++)
	{
		if (*in == '_' && !skipped_underscore)
		{
			skipped_underscore = TRUE;
			continue;
		}

		skipped_underscore = FALSE;
		*out = *in;
		out++;
	}

	*out = '\0';

	return stripped;
}

/*
 * Creates an EphyEncoding for @code, stores it in the encodings table under
 * a copy of @code and emits "encoding-added" for it.
 *
 * @title is passed to the new encoding as given; an underscore-free,
 * normalised variant and its collation key are derived from it here.
 *
 * Returns the new encoding, which is held by the table.
 */
static EphyEncoding *
add_encoding (EphyEncodings *encodings,
	      const char *title,
	      const char *code,
	      EphyLanguageGroup groups)
{
	EphyEncoding *encoding;
	char *plain_title;
	char *normalised_title;
	char *sort_key;

	/* Derive the display and sorting variants of the title. */
	plain_title = elide_underscores (title);
	normalised_title = g_utf8_normalize (plain_title, -1, G_NORMALIZE_DEFAULT);
	sort_key = g_utf8_collate_key (normalised_title, -1);

	/* Create the node and register it. */
	encoding = ephy_encoding_new (code, title,
				      normalised_title, sort_key,
				      groups);
	g_hash_table_insert (encodings->priv->hash, g_strdup (code), encoding);

	g_signal_emit_by_name (encodings, "encoding-added", encoding);

	/* The temporaries are only released once the signal has run. */
	g_free (plain_title);
	g_free (normalised_title);
	g_free (sort_key);

	return encoding;
}

/*
 * Looks up the encoding registered for @code.
 *
 * @encodings: the encodings store
 * @code: the encoding code to look up; must not be NULL
 * @add_if_not_found: when TRUE, an unknown @code gets a new entry titled
 *   "Unknown (<code>)" with no language groups
 *
 * Returns the encoding held by the store (no reference is added), or NULL
 * if @code is unknown and @add_if_not_found is FALSE, or if an argument is
 * invalid.
 */
EphyEncoding *
ephy_encodings_get_encoding (EphyEncodings *encodings,
			     const char *code,
			     gboolean add_if_not_found)
{
	EphyEncoding *encoding;

	g_return_val_if_fail (EPHY_IS_ENCODINGS (encodings), NULL);
	/* The table hashes keys with g_str_hash, which cannot take NULL. */
	g_return_val_if_fail (code != NULL, NULL);

	encoding = g_hash_table_lookup (encodings->priv->hash, code);

	/* if it doesn't exist, add a node for it */
	if (!EPHY_IS_ENCODING (encoding) && add_if_not_found)
	{
		char *title;

		/* Translators: this is the title that an unknown encoding will
		 * be displayed as.
		 */
		title = g_strdup_printf (_("Unknown (%s)"), code);
		encoding = add_encoding (encodings, title, code, 0);
		g_free (title);
	}

	return encoding;
}

/* State passed to get_encodings_foreach() while walking the encodings table. */
typedef struct {
	/* Encodings selected so far; matches are prepended. */
	GList *list;
	/* Language groups an encoding must intersect to be selected. */
	EphyLanguageGroup group_mask;
} GetEncodingsData;

/*
 * Hash-table iteration callback: prepends @value to the list carried in
 * @user_data (a GetEncodingsData) when the encoding shares at least one
 * language group with the requested mask. @key is not used.
 */
static void
get_encodings_foreach (gpointer key,
		       gpointer value,
		       gpointer user_data)
{
	GetEncodingsData *filter = (GetEncodingsData*)user_data;
	EphyLanguageGroup groups;

	groups = ephy_encoding_get_language_groups (EPHY_ENCODING (value));
	if ((groups & filter->group_mask) == 0)
	{
		/* No overlap with the requested groups. */
		return;
	}

	filter->list = g_list_prepend (filter->list, value);
}

/*
 * Collects the encodings that belong to at least one of the language
 * groups in @group_mask.
 *
 * @encodings: the encodings store
 * @group_mask: bitmask of language groups to select
 *
 * Returns a newly built list of the matching encodings, in hash-table
 * iteration order. The list cells are new; the encodings are the ones
 * held by the store (no reference is added). Returns NULL when nothing
 * matches or @encodings is invalid.
 */
GList *
ephy_encodings_get_encodings (EphyEncodings *encodings,
			      EphyLanguageGroup group_mask)
{
	GetEncodingsData data;

	g_return_val_if_fail (EPHY_IS_ENCODINGS (encodings), NULL);

	data.list = NULL;
	data.group_mask = group_mask;

	g_hash_table_foreach (encodings->priv->hash, (GHFunc)get_encodings_foreach, &data);

	/* The callback accumulates into data.list, so that is what must be
	 * returned; a separate local would still be NULL here.
	 */
	return data.list;
}

/*
 * Hash-table iteration callback: prepends @value to the GList whose head
 * pointer is passed in @user_data. @key is not used.
 */
static void
get_all_encodings (gpointer key,
		   gpointer value,
		   gpointer user_data)
{
	GList **result = (GList**)user_data;
	GList *head = *result;

	*result = g_list_prepend (head, value);
}

/*
 * Returns a newly built list of every encoding in the store, in hash-table
 * iteration order. The list cells are new; the encodings are the ones held
 * by the store (no reference is added). Returns NULL if @encodings is
 * invalid or the store is empty.
 */
GList *
ephy_encodings_get_all (EphyEncodings *encodings)
{
	GList *all = NULL;

	g_return_val_if_fail (EPHY_IS_ENCODINGS (encodings), NULL);

	g_hash_table_foreach (encodings->priv->hash,
			      (GHFunc)get_all_encodings,
			      &all);

	return all;
}

/*
 * Records @code as the most recently used encoding.
 *
 * @encodings: the encodings store
 * @code: code of an encoding already known to the store; unknown codes
 *   are ignored
 *
 * The code is moved (or added) to the front of the recent list, the list is
 * trimmed to RECENT_MAX entries, and the result is written as a string
 * array to the EPHY_PREFS_STATE_RECENT_ENCODINGS key of EPHY_SETTINGS_STATE.
 */
void
ephy_encodings_add_recent (EphyEncodings *encodings,
			   const char *code)
{
	GSList *element, *l;
	GVariantBuilder builder;
	EphyEncodingsPrivate *priv;

	g_return_if_fail (EPHY_IS_ENCODINGS (encodings));
	g_return_if_fail (code != NULL);

	/* Only touch the instance after it has been validated. */
	priv = encodings->priv;

	if (ephy_encodings_get_encoding (encodings, code, FALSE) == NULL)
		return;

	/* Keep the list elements unique. */
	element = g_slist_find_custom (priv->recent, code,
				       (GCompareFunc)strcmp);
	if (element != NULL)
	{
		g_free (element->data);
		/* delete_link frees the cell too; remove_link would leak it. */
		priv->recent =
			g_slist_delete_link (priv->recent, element);
	}

	/* Add the new code upfront. */
	priv->recent =
		g_slist_prepend (priv->recent, g_strdup (code));

	/* Truncate the list if necessary; it's at most 1 element too much. */
	if (g_slist_length (priv->recent) > RECENT_MAX)
	{
		GSList *tail;

		tail = g_slist_last (priv->recent);
		g_free (tail->data);
		priv->recent =
			g_slist_delete_link (priv->recent, tail);
	}

	g_variant_builder_init (&builder, G_VARIANT_TYPE_STRING_ARRAY);
	for (l = priv->recent; l; l = l->next)
	{
		g_variant_builder_add (&builder, "s", l->data);
	}

	g_settings_set (EPHY_SETTINGS_STATE,
			EPHY_PREFS_STATE_RECENT_ENCODINGS,
			"as", &builder);
}

/*
 * Returns a newly built list of the encodings named in the recent list.
 *
 * Entries are prepended while the stored list is walked front to back, so
 * the result is in the reverse of the stored order. The list cells are new;
 * the encodings are the ones held by the store (no reference is added).
 * Returns NULL if @encodings is invalid or a stored code has no encoding.
 */
GList *
ephy_encodings_get_recent (EphyEncodings *encodings)
{
	GList *result = NULL;
	GSList *node;

	g_return_val_if_fail (EPHY_IS_ENCODINGS (encodings), NULL);

	node = encodings->priv->recent;
	while (node != NULL)
	{
		EphyEncoding *encoding;

		encoding = ephy_encodings_get_encoding (encodings, (char *)node->data, FALSE);
		g_return_val_if_fail (EPHY_IS_ENCODING (encoding), NULL);

		result = g_list_prepend (result, encoding);
		node = node->next;
	}

	return result;
}

/*
 * Instance initialiser: creates the encodings table, fills it from
 * encoding_entries (translating each title), and loads the recently used
 * codes from the EPHY_PREFS_STATE_RECENT_ENCODINGS key of
 * EPHY_SETTINGS_STATE.
 */
static void
ephy_encodings_init (EphyEncodings *encodings)
{
	char **list;
	guint i;

	encodings->priv = EPHY_ENCODINGS_GET_PRIVATE (encodings);

	LOG ("EphyEncodings initialising");

	/* The table owns its keys (strings) and holds a reference on its values. */
	encodings->priv->hash = g_hash_table_new_full (g_str_hash, g_str_equal,
						       (GDestroyNotify)g_free,
						       (GDestroyNotify)g_object_unref);

	/* Fill the db. */
	for (i = 0; i < G_N_ELEMENTS (encoding_entries); i++)
	{
		add_encoding (encodings,
			      _(encoding_entries[i].title),
			      encoding_entries[i].code,
			      encoding_entries[i].groups);
	}

	/* Get the list of recently used encodings. */
	list = g_settings_get_strv (EPHY_SETTINGS_STATE,
				    EPHY_PREFS_STATE_RECENT_ENCODINGS);

	/* Make sure the list has no duplicates (GtkUIManager goes
	 * crazy otherwise), and only valid entries.
	 */
	encodings->priv->recent = NULL;
	for (i = 0; list[i]; i++)
	{
		const char *item = list[i];

		/* Compare by string content: the stored entries are separate
		 * copies, so a pointer comparison would never find a duplicate.
		 */
		if (g_slist_find_custom (encodings->priv->recent, item,
					 (GCompareFunc)strcmp) == NULL
		    && g_slist_length (encodings->priv->recent) < RECENT_MAX
		    && ephy_encodings_get_encoding (encodings, item, FALSE) != NULL)
		{
			encodings->priv->recent =
				g_slist_prepend (encodings->priv->recent,
						 g_strdup (item));
		}
	}
	/* Entries were prepended; restore the order stored in the settings. */
	encodings->priv->recent = g_slist_reverse (encodings->priv->recent);
	g_strfreev (list);
}

/* Creates a new EphyEncodings instance with default construction properties. */
EphyEncodings *
ephy_encodings_new (void)
{
	EphyEncodings *encodings;

	encodings = g_object_new (EPHY_TYPE_ENCODINGS, NULL);

	return encodings;
}