static void conv_utf8toeuc(gchar *outbuf, gint outlen, const gchar *inbuf);
static void conv_utf8tojis(gchar *outbuf, gint outlen, const gchar *inbuf);
-static void conv_unreadable_eucjp(gchar *str);
static void conv_unreadable_8bit(gchar *str);
-static void conv_unreadable_latin(gchar *str);
static void conv_jistodisp(gchar *outbuf, gint outlen, const gchar *inbuf);
static void conv_sjistodisp(gchar *outbuf, gint outlen, const gchar *inbuf);
conv_euctojis(outbuf, outlen, eucstr);
}
-static gchar valid_eucjp_tbl[][96] = {
- /* 0xa2a0 - 0xa2ff */
- { 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0,
- 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1,
- 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1,
- 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0,
- 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0 },
-
- /* 0xa3a0 - 0xa3ff */
- { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0,
- 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0,
- 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0 },
-
- /* 0xa4a0 - 0xa4ff */
- { 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
-
- /* 0xa5a0 - 0xa5ff */
- { 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
-
- /* 0xa6a0 - 0xa6ff */
- { 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0,
- 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0,
- 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
- 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
-
- /* 0xa7a0 - 0xa7ff */
- { 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
- 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
-
- /* 0xa8a0 - 0xa8ff */
- { 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
- 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
- 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
- 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }
-};
-
-static gboolean isprintableeuckanji(guchar c1, guchar c2)
-{
- if (c1 <= 0xa0 || c1 >= 0xf5)
- return FALSE;
- if (c2 <= 0xa0 || c2 == 0xff)
- return FALSE;
-
- if (c1 >= 0xa9 && c1 <= 0xaf)
- return FALSE;
-
- if (c1 >= 0xa2 && c1 <= 0xa8)
- return (gboolean)valid_eucjp_tbl[c1 - 0xa2][c2 - 0xa0];
-
- if (c1 == 0xcf) {
- if (c2 >= 0xd4 && c2 <= 0xfe)
- return FALSE;
- } else if (c1 == 0xf4) {
- if (c2 >= 0xa7 && c2 <= 0xfe)
- return FALSE;
- }
-
- return TRUE;
-}
-
-static void conv_unreadable_eucjp(gchar *str)
-{
- register guchar *p = str;
-
- while (*p != '\0') {
- if (IS_ASCII(*p)) {
- /* convert CR+LF -> LF */
- if (*p == '\r' && *(p + 1) == '\n')
- memmove(p, p + 1, strlen(p));
- /* printable 7 bit code */
- p++;
- } else if (iseuckanji(*p)) {
- if (isprintableeuckanji(*p, *(p + 1))) {
- /* printable euc-jp code */
- p += 2;
- } else {
- /* substitute unprintable code */
- *p++ = SUBST_CHAR;
- if (*p != '\0') {
- if (IS_ASCII(*p))
- p++;
- else
- *p++ = SUBST_CHAR;
- }
- }
- } else if (iseuchwkana1(*p)) {
- if (iseuchwkana2(*(p + 1)))
- /* euc-jp hankaku kana */
- p += 2;
- else
- *p++ = SUBST_CHAR;
- } else if (iseucaux(*p)) {
- if (iseuckanji(*(p + 1)) && iseuckanji(*(p + 2))) {
- /* auxiliary kanji */
- p += 3;
- } else
- *p++ = SUBST_CHAR;
- } else
- /* substitute unprintable 1 byte code */
- *p++ = SUBST_CHAR;
- }
-}
-
static void conv_unreadable_8bit(gchar *str)
{
register guchar *p = str;
}
}
-static void conv_unreadable_latin(gchar *str)
-{
- register guchar *p = str;
-
- while (*p != '\0') {
- /* convert CR+LF -> LF */
- if (*p == '\r' && *(p + 1) == '\n')
- memmove(p, p + 1, strlen(p));
- else if ((*p & 0xff) >= 0x7f && (*p & 0xff) <= 0x9f)
- *p = SUBST_CHAR;
- p++;
- }
-}
-
#define NCV '\0'
void conv_mb_alnum(gchar *str)
tmpstr = conv_iconv_strdup(inbuf, conv_get_locale_charset_str(),
CS_INTERNAL);
- if (tmpstr) {
+ if (tmpstr && g_utf8_validate(tmpstr, -1, NULL)) {
strncpy2(outbuf, tmpstr, outlen);
g_free(tmpstr);
+ } else if (tmpstr && !g_utf8_validate(tmpstr, -1, NULL)) {
+ g_free(tmpstr);
+ conv_utf8todisp(outbuf, outlen, inbuf);
} else
conv_utf8todisp(outbuf, outlen, inbuf);
}
/* auto detection mode */
if (!src_charset_str && !dest_charset_str) {
- if (src_charset == C_EUC_JP || src_charset == C_SHIFT_JIS)
+ if (conv_is_ja_locale())
return conv_anytodisp;
else
return conv_noconv;
{"ja_JP.ujis" , C_EUC_JP , C_ISO_2022_JP},
{"ja_JP.SJIS" , C_SHIFT_JIS , C_ISO_2022_JP},
{"ja_JP.JIS" , C_ISO_2022_JP , C_ISO_2022_JP},
+#ifdef G_OS_WIN32
+ {"ja_JP" , C_SHIFT_JIS , C_ISO_2022_JP},
+#else
{"ja_JP" , C_EUC_JP , C_ISO_2022_JP},
+#endif
{"ko_KR.EUC-KR" , C_EUC_KR , C_EUC_KR},
{"ko_KR" , C_EUC_KR , C_EUC_KR},
{"zh_CN.GB2312" , C_GB2312 , C_GB2312},
return out_charset;
}
+ if (strcasestr(cur_locale, "UTF-8")) {
+ out_charset = C_UTF_8;
+ return out_charset;
+ }
+
if ((p = strcasestr(cur_locale, "@euro")) && p[5] == '\0') {
out_charset = C_ISO_8859_15;
return out_charset;
CharSet out_charset;
const gchar *str;
- if (prefs_common.outgoing_charset) {
- if (!isalpha((guchar)prefs_common.outgoing_charset[0])) {
- g_free(prefs_common.outgoing_charset);
- prefs_common.outgoing_charset = g_strdup(CS_AUTO);
- } else if (strcmp(prefs_common.outgoing_charset, CS_AUTO) != 0)
- return prefs_common.outgoing_charset;
- }
-
out_charset = conv_get_outgoing_charset();
str = conv_get_charset_str(out_charset);
{
const gchar *cur_locale;
+#ifdef G_OS_WIN32
+ cur_locale = g_win32_getlocale();
+#else
cur_locale = g_getenv("LC_ALL");
if (!cur_locale) cur_locale = g_getenv("LC_CTYPE");
if (!cur_locale) cur_locale = g_getenv("LANG");
if (!cur_locale) cur_locale = setlocale(LC_CTYPE, NULL);
+#endif /* G_OS_WIN32 */
debug_print("current locale: %s\n",
cur_locale ? cur_locale : "(none)");
return cur_locale;
}
+gboolean conv_is_ja_locale(void)
+{
+ static gint is_ja_locale = -1;
+ const gchar *cur_locale;
+
+ if (is_ja_locale != -1)
+ return is_ja_locale != 0;
+
+ is_ja_locale = 0;
+ cur_locale = conv_get_current_locale();
+ if (cur_locale) {
+ if (g_ascii_strncasecmp(cur_locale, "ja", 2) == 0)
+ is_ja_locale = 1;
+ }
+
+ return is_ja_locale != 0;
+}
+
gchar *conv_unmime_header(const gchar *str, const gchar *default_encoding)
{
gchar buf[BUFFSIZE];
}
}
- if (conv_get_locale_charset() == C_EUC_JP)
+ if (conv_is_ja_locale())
conv_anytodisp(buf, sizeof(buf), str);
else
conv_localetodisp(buf, sizeof(buf), str);
} \
}
-void conv_encode_header(gchar *dest, gint len, const gchar *src,
- gint header_len, gboolean addr_field)
+void conv_encode_header_full(gchar *dest, gint len, const gchar *src,
+ gint header_len, gboolean addr_field,
+ const gchar *out_encoding_)
{
const gchar *cur_encoding;
const gchar *out_encoding;
}
cur_encoding = CS_INTERNAL;
- out_encoding = conv_get_outgoing_charset_str();
+
+ if (out_encoding_)
+ out_encoding = out_encoding_;
+ else
+ out_encoding = conv_get_outgoing_charset_str();
+
if (!strcmp(out_encoding, CS_US_ASCII))
out_encoding = CS_ISO_8859_1;
*destp = '\0';
}
+void conv_encode_header(gchar *dest, gint len, const gchar *src,
+ gint header_len, gboolean addr_field)
+{
+ conv_encode_header_full(dest,len,src,header_len,addr_field,NULL);
+}
+
#undef LBREAK_IF_REQUIRED
gchar *conv_filename_from_utf8(const gchar *utf8_file)
{