1 /* libxmms-flac - XMMS FLAC input plugin
2  * Copyright (C) 2002,2003,2004,2005,2006,2007,2008,2009  Daisuke Shimamura
3  *
4  * Almost from charset.c
5  *  EasyTAG - Tag editor for MP3 and OGG files
 *  Copyright (C) 1999-2001  Håvard Kvålen <havardk@xmms.org>
7  *
8  * This program is free software; you can redistribute it and/or
9  * modify it under the terms of the GNU General Public License
10  * as published by the Free Software Foundation; either version 2
11  * of the License, or (at your option) any later version.
12  *
13  * This program is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
16  * GNU General Public License for more details.
17  *
18  * You should have received a copy of the GNU General Public License along
19  * with this program; if not, write to the Free Software Foundation, Inc.,
20  * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
21  */
22 
23 #ifdef HAVE_CONFIG_H
24 #include "config.h"
25 #endif
26 
27 #include "plugin.h"
28 
29 #include <stdlib.h>
30 #include <glib.h>
31 #include <string.h>
32 #include <errno.h>
33 
34 #include "plugin_common/charset.h"
35 #include "charset.h"
36 #include "configure.h"
37 #include "locale_hack.h"
38 
39 
40 /****************
41  * Declarations *
42  ****************/
43 
44 #define CHARSET_TRANS_ARRAY_LEN ( sizeof(charset_trans_array) / sizeof((charset_trans_array)[0]) )
45 const CharsetInfo charset_trans_array[] = {
46 	{N_("Arabic (IBM-864)"),                  "IBM864"        },
47 	{N_("Arabic (ISO-8859-6)"),               "ISO-8859-6"    },
48 	{N_("Arabic (Windows-1256)"),             "windows-1256"  },
49 	{N_("Baltic (ISO-8859-13)"),              "ISO-8859-13"   },
50 	{N_("Baltic (ISO-8859-4)"),               "ISO-8859-4"    },
51 	{N_("Baltic (Windows-1257)"),             "windows-1257"  },
52 	{N_("Celtic (ISO-8859-14)"),              "ISO-8859-14"   },
53 	{N_("Central European (IBM-852)"),        "IBM852"        },
54 	{N_("Central European (ISO-8859-2)"),     "ISO-8859-2"    },
55 	{N_("Central European (Windows-1250)"),   "windows-1250"  },
56 	{N_("Chinese Simplified (GB18030)"),      "gb18030"       },
57 	{N_("Chinese Simplified (GB2312)"),       "GB2312"        },
58 	{N_("Chinese Traditional (Big5)"),        "Big5"          },
59 	{N_("Chinese Traditional (Big5-HKSCS)"),  "Big5-HKSCS"    },
60 	{N_("Cyrillic (IBM-855)"),                "IBM855"        },
61 	{N_("Cyrillic (ISO-8859-5)"),             "ISO-8859-5"    },
62 	{N_("Cyrillic (ISO-IR-111)"),             "ISO-IR-111"    },
63 	{N_("Cyrillic (KOI8-R)"),                 "KOI8-R"        },
64 	{N_("Cyrillic (Windows-1251)"),           "windows-1251"  },
65 	{N_("Cyrillic/Russian (CP-866)"),         "IBM866"        },
66 	{N_("Cyrillic/Ukrainian (KOI8-U)"),       "KOI8-U"        },
67 	{N_("English (US-ASCII)"),                "us-ascii"      },
68 	{N_("Greek (ISO-8859-7)"),                "ISO-8859-7"    },
69 	{N_("Greek (Windows-1253)"),              "windows-1253"  },
70 	{N_("Hebrew (IBM-862)"),                  "IBM862"        },
71 	{N_("Hebrew (Windows-1255)"),             "windows-1255"  },
72 	{N_("Japanese (EUC-JP)"),                 "EUC-JP"        },
73 	{N_("Japanese (ISO-2022-JP)"),            "ISO-2022-JP"   },
74 	{N_("Japanese (Shift_JIS)"),              "Shift_JIS"     },
75 	{N_("Korean (EUC-KR)"),                   "EUC-KR"        },
76 	{N_("Nordic (ISO-8859-10)"),              "ISO-8859-10"   },
77 	{N_("South European (ISO-8859-3)"),       "ISO-8859-3"    },
78 	{N_("Thai (TIS-620)"),                    "TIS-620"       },
79 	{N_("Turkish (IBM-857)"),                 "IBM857"        },
80 	{N_("Turkish (ISO-8859-9)"),              "ISO-8859-9"    },
81 	{N_("Turkish (Windows-1254)"),            "windows-1254"  },
82 	{N_("Unicode (UTF-7)"),                   "UTF-7"         },
83 	{N_("Unicode (UTF-8)"),                   "UTF-8"         },
84 	{N_("Unicode (UTF-16BE)"),                "UTF-16BE"      },
85 	{N_("Unicode (UTF-16LE)"),                "UTF-16LE"      },
86 	{N_("Unicode (UTF-32BE)"),                "UTF-32BE"      },
87 	{N_("Unicode (UTF-32LE)"),                "UTF-32LE"      },
88 	{N_("Vietnamese (VISCII)"),               "VISCII"        },
89 	{N_("Vietnamese (Windows-1258)"),         "windows-1258"  },
90 	{N_("Visual Hebrew (ISO-8859-8)"),        "ISO-8859-8"    },
91 	{N_("Western (IBM-850)"),                 "IBM850"        },
92 	{N_("Western (ISO-8859-1)"),              "ISO-8859-1"    },
93 	{N_("Western (ISO-8859-15)"),             "ISO-8859-15"   },
94 	{N_("Western (Windows-1252)"),            "windows-1252"  }
95 
96 	/*
97 	 * From this point, character sets aren't supported by iconv
98 	 */
99 #if 0
100 	{N_("Arabic (IBM-864-I)"),                "IBM864i"              },
101 	{N_("Arabic (ISO-8859-6-E)"),             "ISO-8859-6-E"         },
102 	{N_("Arabic (ISO-8859-6-I)"),             "ISO-8859-6-I"         },
103 	{N_("Arabic (MacArabic)"),                "x-mac-arabic"         },
104 	{N_("Armenian (ARMSCII-8)"),              "armscii-8"            },
105 	{N_("Central European (MacCE)"),          "x-mac-ce"             },
106 	{N_("Chinese Simplified (GBK)"),          "x-gbk"                },
107 	{N_("Chinese Simplified (HZ)"),           "HZ-GB-2312"           },
108 	{N_("Chinese Traditional (EUC-TW)"),      "x-euc-tw"             },
109 	{N_("Croatian (MacCroatian)"),            "x-mac-croatian"       },
110 	{N_("Cyrillic (MacCyrillic)"),            "x-mac-cyrillic"       },
111 	{N_("Cyrillic/Ukrainian (MacUkrainian)"), "x-mac-ukrainian"      },
112 	{N_("Farsi (MacFarsi)"),                  "x-mac-farsi"},
113 	{N_("Greek (MacGreek)"),                  "x-mac-greek"          },
114 	{N_("Gujarati (MacGujarati)"),            "x-mac-gujarati"       },
115 	{N_("Gurmukhi (MacGurmukhi)"),            "x-mac-gurmukhi"       },
116 	{N_("Hebrew (ISO-8859-8-E)"),             "ISO-8859-8-E"         },
117 	{N_("Hebrew (ISO-8859-8-I)"),             "ISO-8859-8-I"         },
118 	{N_("Hebrew (MacHebrew)"),                "x-mac-hebrew"         },
119 	{N_("Hindi (MacDevanagari)"),             "x-mac-devanagari"     },
120 	{N_("Icelandic (MacIcelandic)"),          "x-mac-icelandic"      },
121 	{N_("Korean (JOHAB)"),                    "x-johab"              },
122 	{N_("Korean (UHC)"),                      "x-windows-949"        },
123 	{N_("Romanian (MacRomanian)"),            "x-mac-romanian"       },
124 	{N_("Turkish (MacTurkish)"),              "x-mac-turkish"        },
125 	{N_("User Defined"),                      "x-user-defined"       },
126 	{N_("Vietnamese (TCVN)"),                 "x-viet-tcvn5712"      },
127 	{N_("Vietnamese (VPS)"),                  "x-viet-vps"           },
128 	{N_("Western (MacRoman)"),                "x-mac-roman"          },
129 	/* charsets whithout posibly translatable names */
130 	{"T61.8bit",                              "T61.8bit"             },
131 	{"x-imap4-modified-utf7",                 "x-imap4-modified-utf7"},
132 	{"x-u-escaped",                           "x-u-escaped"          },
133 	{"windows-936",                           "windows-936"          }
134 #endif
135 };
136 
137 /*************
138  * Functions *
139  *************/
140 
141 /*
 * Common conversion functions
143  */
convert_from_utf8_to_user(const char * string)144 char *convert_from_utf8_to_user(const char *string)
145 {
146 	return FLAC_plugin__charset_convert_string(string, "UTF-8", flac_cfg.title.user_char_set);
147 }
148 
convert_from_user_to_utf8(const char * string)149 char *convert_from_user_to_utf8(const char *string)
150 {
151 	return FLAC_plugin__charset_convert_string(string, flac_cfg.title.user_char_set, "UTF-8");
152 }
153 
Charset_Create_List(void)154 GList *Charset_Create_List (void)
155 {
156 	GList *list = NULL;
157 	guint i;
158 
159 	for (i=0; i<CHARSET_TRANS_ARRAY_LEN; i++)
160 		list = g_list_append(list,_(charset_trans_array[i].charset_title));
161 	return list;
162 }
163 
Charset_Create_List_UTF8_Only(void)164 GList *Charset_Create_List_UTF8_Only (void)
165 {
166 	GList *list = NULL;
167 
168 	list = g_list_append(list,_(Charset_Get_Title_From_Name("UTF-8")));
169 	return list;
170 }
171 
172 
173 /*
174  * Return charset_name from charset_title
175  */
Charset_Get_Name_From_Title(gchar * charset_title)176 gchar *Charset_Get_Name_From_Title (gchar *charset_title)
177 {
178 	guint i;
179 
180 	if (charset_title)
181 		for (i=0; i<CHARSET_TRANS_ARRAY_LEN; i++)
182 			if ( strcasecmp(_(charset_title),_(charset_trans_array[i].charset_title)) == 0 )
183 				return charset_trans_array[i].charset_name;
184 	return "";
185 }
186 
187 
188 /*
189  * Return charset_title from charset_name
190  */
Charset_Get_Title_From_Name(gchar * charset_name)191 gchar *Charset_Get_Title_From_Name (gchar *charset_name)
192 {
193 	guint i;
194 
195 	if (charset_name)
196 		for (i=0; i<CHARSET_TRANS_ARRAY_LEN; i++)
197 			if ( strcasecmp(charset_name,charset_trans_array[i].charset_name) == 0 )
198 				return _(charset_trans_array[i].charset_title);
199 	return "";
200 }
201