X-Git-Url: http://git.osdn.net/view?a=blobdiff_plain;f=src%2Fjapanese.c;h=4e0c0b1a2ddcdcedf45d899e8b73b6c92e5d30ec;hb=b3317ce27a28a6d78ffccf52460ab56d95c83e09;hp=b746e11080ebf8eb6cd1bce0a6c30b3a77d72e8a;hpb=882170201699e6f4b6df149d31e1becd3cbf0415;p=hengband%2Fhengband.git diff --git a/src/japanese.c b/src/japanese.c index b746e1108..4e0c0b1a2 100644 --- a/src/japanese.c +++ b/src/japanese.c @@ -1,5 +1,8 @@ -/* File: japanese.c */ - +/*! + * @file japanese.c + * @brief 日本語処理関数 + * @date 2014/07/07 + */ #include "angband.h" @@ -9,64 +12,70 @@ typedef struct convert_key convert_key; struct convert_key { - cptr key1; - cptr key2; + concptr key1; + concptr key2; }; static const convert_key s2j_table[] = { {"mb","nb"}, {"mp","np"}, {"mv","nv"}, {"mm","nm"}, {"x","ks"}, - /* sindar:¥·¥ó¥À¡¼¥ë parantir:¥Ñ¥é¥ó¥Æ¥£¥¢ feanor:¥Õ¥§¥¢¥Î¡¼¥ë */ + /* sindar:シンダール parantir:パランティア feanor:フェアノール */ {"ar$","a-ru$"}, {"ir$","ia$"}, {"or$","o-ru$"}, - {"ra","¥é"}, {"ri","¥ê"}, {"ru","¥ë"}, {"re","¥ì"}, {"ro","¥í"}, - {"ir","ia"}, {"ur","ua"}, {"er","ea"}, {"ar","a¥ë"}, - {"sha","¥·¥ã"}, {"shi","¥·"}, {"shu","¥·¥å"}, {"she","¥·¥§"}, {"sho","¥·¥ç"}, - {"tha","¥µ"}, {"thi","¥·"}, {"thu","¥¹"}, {"the","¥»"}, {"tho","¥½"}, - {"cha","¥Ï"}, {"chi","¥Ò"}, {"chu","¥Õ"}, {"che","¥Ø"}, {"cho","¥Û"}, - {"dha","¥¶"}, {"dhi","¥¸"}, {"dhu","¥º"}, {"dhe","¥¼"}, {"dho","¥¾"}, - {"ba","¥Ð"}, {"bi","¥Ó"}, {"bu","¥Ö"}, {"be","¥Ù"}, {"bo","¥Ü"}, - {"ca","¥«"}, {"ci","¥­"}, {"cu","¥¯"}, {"ce","¥±"}, {"co","¥³"}, - {"da","¥À"}, {"di","¥Ç¥£"}, {"du","¥É¥¥"}, {"de","¥Ç"}, {"do","¥É"}, - {"fa","¥Õ¥¡"}, {"fi","¥Õ¥£"}, {"fu","¥Õ"}, {"fe","¥Õ¥§"}, {"fo","¥Õ¥©"}, - {"ga","¥¬"}, {"gi","¥®"}, {"gu","¥°"}, {"ge","¥²"}, {"go","¥´"}, - {"ha","¥Ï"}, {"hi","¥Ò"}, {"hu","¥Õ"}, {"he","¥Ø"}, {"ho","¥Û"}, - {"ja","¥¸¥ã"}, {"ji","¥¸"}, {"ju","¥¸¥å"}, {"je","¥¸¥§"}, {"jo","¥¸¥ç"}, - {"ka","¥«"}, {"ki","¥­"}, {"ku","¥¯"}, {"ke","¥±"}, {"ko","¥³"}, - {"la","¥é"}, {"li","¥ê"}, {"lu","¥ë"}, {"le","¥ì"}, {"lo","¥í"}, - {"ma","¥Þ"}, {"mi","¥ß"}, {"mu","¥à"}, {"me","¥á"}, {"mo","¥â"}, - {"na","¥Ê"}, {"ni","¥Ë"}, {"nu","¥Ì"}, {"ne","¥Í"}, {"no","¥Î"}, - {"pa","¥Ñ"}, {"pi","¥Ô"}, {"pu","¥×"}, {"pe","¥Ú"}, {"po","¥Ý"}, - {"qu","¥¯"}, - {"sa","¥µ"}, {"si","¥·"}, {"su","¥¹"}, {"se","¥»"}, {"so","¥½"}, - {"ta","¥¿"}, {"ti","¥Æ¥£"}, {"tu","¥È¥¥"}, {"te","¥Æ"}, {"to","¥È"}, - {"va","¥ô¥¡"}, {"vi","¥ô¥£"}, {"vu","¥ô"}, {"ve","¥ô¥§"}, {"vo","¥ô¥©"}, - {"wa","¥ï"}, {"wi","¥¦¥£"}, {"wu","¥¦"}, {"we","¥¦¥§"}, {"wo","¥¦¥©"}, - {"ya","¥ä"}, {"yu","¥æ"}, {"yo","¥è"}, - {"za","¥¶"}, {"zi","¥¸"}, {"zu","¥º"}, {"ze","¥¼"}, {"zo","¥¾"}, - {"dh","¥º"}, {"ch","¥Õ"}, {"th","¥¹"}, - {"b","¥Ö"}, {"c","¥¯"}, {"d","¥É"}, {"f","¥Õ"}, {"g","¥°"}, - {"h","¥Õ"}, {"j","¥¸¥å"}, {"k","¥¯"}, {"l","¥ë"}, {"m","¥à"}, - {"n","¥ó"}, {"p","¥×"}, {"q","¥¯"}, {"r","¥ë"}, {"s","¥¹"}, - {"t","¥È"}, {"v","¥ô"}, {"w","¥¦"}, {"y","¥¤"}, - {"a","¥¢"}, {"i","¥¤"}, {"u","¥¦"}, {"e","¥¨"}, {"o","¥ª"}, - {"-","¡¼"}, + {"ra","ラ"}, {"ri","リ"}, {"ru","ル"}, {"re","レ"}, {"ro","ロ"}, + {"ir","ia"}, {"ur","ua"}, {"er","ea"}, {"ar","aル"}, + {"sha","シャ"}, {"shi","シ"}, {"shu","シュ"}, {"she","シェ"}, {"sho","ショ"}, + {"tha","サ"}, {"thi","シ"}, {"thu","ス"}, {"the","セ"}, {"tho","ソ"}, + {"cha","ハ"}, {"chi","ヒ"}, {"chu","フ"}, {"che","ヘ"}, {"cho","ホ"}, + {"dha","ザ"}, {"dhi","ジ"}, {"dhu","ズ"}, {"dhe","ゼ"}, {"dho","ゾ"}, + {"ba","バ"}, {"bi","ビ"}, {"bu","ブ"}, {"be","ベ"}, {"bo","ボ"}, + {"ca","カ"}, {"ci","キ"}, {"cu","ク"}, {"ce","ケ"}, {"co","コ"}, + {"da","ダ"}, {"di","ディ"}, {"du","ドゥ"}, {"de","デ"}, {"do","ド"}, + {"fa","ファ"}, {"fi","フィ"}, {"fu","フ"}, {"fe","フェ"}, {"fo","フォ"}, + {"ga","ガ"}, {"gi","ギ"}, {"gu","グ"}, {"ge","ゲ"}, {"go","ゴ"}, + {"ha","ハ"}, {"hi","ヒ"}, {"hu","フ"}, {"he","ヘ"}, {"ho","ホ"}, + {"ja","ジャ"}, {"ji","ジ"}, {"ju","ジュ"}, {"je","ジェ"}, {"jo","ジョ"}, + {"ka","カ"}, {"ki","キ"}, {"ku","ク"}, {"ke","ケ"}, {"ko","コ"}, + {"la","ラ"}, {"li","リ"}, {"lu","ル"}, {"le","レ"}, {"lo","ロ"}, + {"ma","マ"}, {"mi","ミ"}, {"mu","ム"}, {"me","メ"}, {"mo","モ"}, + {"na","ナ"}, {"ni","ニ"}, {"nu","ヌ"}, {"ne","ネ"}, {"no","ノ"}, + {"pa","パ"}, {"pi","ピ"}, {"pu","プ"}, {"pe","ペ"}, {"po","ポ"}, + {"qu","ク"}, + {"sa","サ"}, {"si","シ"}, {"su","ス"}, {"se","セ"}, {"so","ソ"}, + {"ta","タ"}, {"ti","ティ"}, {"tu","トゥ"}, {"te","テ"}, {"to","ト"}, + {"va","ヴァ"}, {"vi","ヴィ"}, {"vu","ヴ"}, {"ve","ヴェ"}, {"vo","ヴォ"}, + {"wa","ワ"}, {"wi","ウィ"}, {"wu","ウ"}, {"we","ウェ"}, {"wo","ウォ"}, + {"ya","ヤ"}, {"yu","ユ"}, {"yo","ヨ"}, + {"za","ザ"}, {"zi","ジ"}, {"zu","ズ"}, {"ze","ゼ"}, {"zo","ゾ"}, + {"dh","ズ"}, {"ch","フ"}, {"th","ス"}, + {"b","ブ"}, {"c","ク"}, {"d","ド"}, {"f","フ"}, {"g","グ"}, + {"h","フ"}, {"j","ジュ"}, {"k","ク"}, {"l","ル"}, {"m","ム"}, + {"n","ン"}, {"p","プ"}, {"q","ク"}, {"r","ル"}, {"s","ス"}, + {"t","ト"}, {"v","ヴ"}, {"w","ウ"}, {"y","イ"}, + {"a","ア"}, {"i","イ"}, {"u","ウ"}, {"e","エ"}, {"o","オ"}, + {"-","ー"}, {NULL,NULL} }; -/* ¥·¥ó¥À¥ê¥ó¤òÆüËܸì¤ÎÆɤߤËÊÑ´¹¤¹¤ë */ -void sindarin_to_kana(char *kana, const char *sindarin) +/*! + * @brief シンダリンを日本語の読みに変換する + * @param kana 変換後の日本語文字列ポインタ + * @param sindarin 変換前のシンダリン文字列ポインタ + * @return なし + * @details + */ +void sindarin_to_kana(char *kana, concptr sindarin) { char buf[256]; int idx; sprintf(kana, "%s$", sindarin); for (idx = 0; kana[idx]; idx++) - if (isupper(kana[idx])) kana[idx] = tolower(kana[idx]); + if (isupper(kana[idx])) kana[idx] = (char)tolower(kana[idx]); for (idx = 0; s2j_table[idx].key1 != NULL; idx++) { - cptr pat1 = s2j_table[idx].key1; - cptr pat2 = s2j_table[idx].key2; + concptr pat1 = s2j_table[idx].key1; + concptr pat2 = s2j_table[idx].key2; int len = strlen(pat1); char *src = kana; char *dest = buf; @@ -105,128 +114,77 @@ void sindarin_to_kana(char *kana, const char *sindarin) } -/*ÆüËܸìÆ°»ì³èÍÑ (ÂǤġäÂǤäÆ,ÂǤÁ etc) */ - -#define CMPTAIL(y) strncmp(&in[l-(int)strlen(y)],y,strlen(y)) - -/* ²¥¤ë,½³¤ë¡ä²¥¤ê,½³¤ë */ -void jverb1( const char *in , char *out){ -int l=strlen(in); -strcpy(out,in); - -if( CMPTAIL("¤¹¤ë")==0) sprintf(&out[l-4],"¤·");else -if( CMPTAIL("¤¤¤ë")==0) sprintf(&out[l-4],"¤¤¤Æ");else - -if( CMPTAIL("¤¨¤ë")==0) sprintf(&out[l-4],"¤¨");else -if( CMPTAIL("¤±¤ë")==0) sprintf(&out[l-4],"¤±");else -if( CMPTAIL("¤²¤ë")==0) sprintf(&out[l-4],"¤²");else -if( CMPTAIL("¤»¤ë")==0) sprintf(&out[l-4],"¤»");else -if( CMPTAIL("¤¼¤ë")==0) sprintf(&out[l-4],"¤¼");else -if( CMPTAIL("¤Æ¤ë")==0) sprintf(&out[l-4],"¤Æ");else -if( CMPTAIL("¤Ç¤ë")==0) sprintf(&out[l-4],"¤Ç");else -if( CMPTAIL("¤Í¤ë")==0) sprintf(&out[l-4],"¤Í");else -if( CMPTAIL("¤Ø¤ë")==0) sprintf(&out[l-4],"¤Ø");else -if( CMPTAIL("¤Ù¤ë")==0) sprintf(&out[l-4],"¤Ù");else -if( CMPTAIL("¤á¤ë")==0) sprintf(&out[l-4],"¤á");else -if( CMPTAIL("¤ì¤ë")==0) sprintf(&out[l-4],"¤ì");else - -if( CMPTAIL("¤¦")==0) sprintf(&out[l-2],"¤¤");else -if( CMPTAIL("¤¯")==0) sprintf(&out[l-2],"¤­");else -if( CMPTAIL("¤°")==0) sprintf(&out[l-2],"¤®");else -if( CMPTAIL("¤¹")==0) sprintf(&out[l-2],"¤·");else -if( CMPTAIL("¤º")==0) sprintf(&out[l-2],"¤¸");else -if( CMPTAIL("¤Ä")==0) sprintf(&out[l-2],"¤Á");else -if( CMPTAIL("¤Å")==0) sprintf(&out[l-2],"¤Â");else -if( CMPTAIL("¤Ì")==0) sprintf(&out[l-2],"¤Ë");else -if( CMPTAIL("¤Õ")==0) sprintf(&out[l-2],"¤Ò");else -if( CMPTAIL("¤Ö")==0) sprintf(&out[l-2],"¤Ó");else -if( CMPTAIL("¤à")==0) sprintf(&out[l-2],"¤ß");else -if( CMPTAIL("¤ë")==0) sprintf(&out[l-2],"¤ê");else - - sprintf(&out[l],"¤½¤·¤Æ");} - -/* ²¥¤ë,½³¤ë> ²¥¤Ã¤Æ½³¤ë */ -void jverb2( const char *in , char *out){ -int l=strlen(in); -strcpy(out,in); - -if( CMPTAIL("¤¹¤ë")==0) sprintf(&out[l-4],"¤·¤Æ");else -if( CMPTAIL("¤¤¤ë")==0) sprintf(&out[l-4],"¤¤¤Æ");else - -if( CMPTAIL("¤¨¤ë")==0) sprintf(&out[l-4],"¤¨¤Æ");else -if( CMPTAIL("¤±¤ë")==0) sprintf(&out[l-4],"¤±¤Æ");else -if( CMPTAIL("¤²¤ë")==0) sprintf(&out[l-4],"¤²¤Æ");else -if( CMPTAIL("¤»¤ë")==0) sprintf(&out[l-4],"¤»¤Æ");else -if( CMPTAIL("¤¼¤ë")==0) sprintf(&out[l-4],"¤¼¤Æ");else -if( CMPTAIL("¤Æ¤ë")==0) sprintf(&out[l-4],"¤Æ¤Ã¤Æ");else -if( CMPTAIL("¤Ç¤ë")==0) sprintf(&out[l-4],"¤Ç¤Æ");else -if( CMPTAIL("¤Í¤ë")==0) sprintf(&out[l-4],"¤Í¤Æ");else -if( CMPTAIL("¤Ø¤ë")==0) sprintf(&out[l-4],"¤Ø¤Æ");else -if( CMPTAIL("¤Ù¤ë")==0) sprintf(&out[l-4],"¤Ù¤Æ");else -if( CMPTAIL("¤á¤ë")==0) sprintf(&out[l-4],"¤á¤Æ");else -if( CMPTAIL("¤ì¤ë")==0) sprintf(&out[l-4],"¤ì¤Æ");else - -if( CMPTAIL("¤¦")==0) sprintf(&out[l-2],"¤Ã¤Æ");else -if( CMPTAIL("¤¯")==0) sprintf(&out[l-2],"¤¤¤Æ");else -if( CMPTAIL("¤°")==0) sprintf(&out[l-2],"¤¤¤Ç");else -if( CMPTAIL("¤¹")==0) sprintf(&out[l-2],"¤·¤Æ");else -if( CMPTAIL("¤º")==0) sprintf(&out[l-2],"¤¸¤Æ");else -if( CMPTAIL("¤Ä")==0) sprintf(&out[l-2],"¤Ã¤Æ");else -if( CMPTAIL("¤Å")==0) sprintf(&out[l-2],"¤Ã¤Æ");else -if( CMPTAIL("¤Ì")==0) sprintf(&out[l-2],"¤Í¤Æ");else -if( CMPTAIL("¤Õ")==0) sprintf(&out[l-2],"¤Ø¤Æ");else -if( CMPTAIL("¤Ö")==0) sprintf(&out[l-2],"¤ó¤Ç");else -if( CMPTAIL("¤à")==0) sprintf(&out[l-2],"¤ó¤Ç");else -if( CMPTAIL("¤ë")==0) sprintf(&out[l-2],"¤Ã¤Æ");else - sprintf(&out[l],"¤³¤È¤Ë¤è¤ê");} - -/* ²¥¤ë,½³¤ë > ²¥¤Ã¤¿¤ê½³¤Ã¤¿¤ê */ -void jverb3( const char *in , char *out){ -int l=strlen(in); -strcpy(out,in); - -if( CMPTAIL("¤¹¤ë")==0) sprintf(&out[l-4],"¤·¤¿");else -if( CMPTAIL("¤¤¤ë")==0) sprintf(&out[l-4],"¤¤¤¿");else - -if( CMPTAIL("¤¨¤ë")==0) sprintf(&out[l-4],"¤¨¤¿");else -if( CMPTAIL("¤±¤ë")==0) sprintf(&out[l-4],"¤±¤¿");else -if( CMPTAIL("¤²¤ë")==0) sprintf(&out[l-4],"¤²¤¿");else -if( CMPTAIL("¤»¤ë")==0) sprintf(&out[l-4],"¤»¤¿");else -if( CMPTAIL("¤¼¤ë")==0) sprintf(&out[l-4],"¤¼¤¿");else -if( CMPTAIL("¤Æ¤ë")==0) sprintf(&out[l-4],"¤Æ¤Ã¤¿");else -if( CMPTAIL("¤Ç¤ë")==0) sprintf(&out[l-4],"¤Ç¤¿");else -if( CMPTAIL("¤Í¤ë")==0) sprintf(&out[l-4],"¤Í¤¿");else -if( CMPTAIL("¤Ø¤ë")==0) sprintf(&out[l-4],"¤Ø¤¿");else -if( CMPTAIL("¤Ù¤ë")==0) sprintf(&out[l-4],"¤Ù¤¿");else -if( CMPTAIL("¤á¤ë")==0) sprintf(&out[l-4],"¤á¤¿");else -if( CMPTAIL("¤ì¤ë")==0) sprintf(&out[l-4],"¤ì¤¿");else - -if( CMPTAIL("¤¦")==0) sprintf(&out[l-2],"¤Ã¤¿");else -if( CMPTAIL("¤¯")==0) sprintf(&out[l-2],"¤¤¤¿");else -if( CMPTAIL("¤°")==0) sprintf(&out[l-2],"¤¤¤À");else -if( CMPTAIL("¤¹")==0) sprintf(&out[l-2],"¤·¤¿");else -if( CMPTAIL("¤º")==0) sprintf(&out[l-2],"¤¸¤¿");else -if( CMPTAIL("¤Ä")==0) sprintf(&out[l-2],"¤Ã¤¿");else -if( CMPTAIL("¤Å")==0) sprintf(&out[l-2],"¤Ã¤¿");else -if( CMPTAIL("¤Ì")==0) sprintf(&out[l-2],"¤Í¤¿");else -if( CMPTAIL("¤Õ")==0) sprintf(&out[l-2],"¤Ø¤¿");else -if( CMPTAIL("¤Ö")==0) sprintf(&out[l-2],"¤ó¤À");else -if( CMPTAIL("¤à")==0) sprintf(&out[l-2],"¤ó¤À");else -if( CMPTAIL("¤ë")==0) sprintf(&out[l-2],"¤Ã¤¿");else - sprintf(&out[l],"¤³¤È¤ä");} - - -void jverb( const char *in , char *out , int flag){ - switch (flag){ - case JVERB_AND:jverb1(in , out);break; - case JVERB_TO :jverb2(in , out);break; - case JVERB_OR :jverb3(in , out);break; - } -} +/*! 日本語動詞活用 (打つ>打って,打ち etc) + * JVERB_AND: 殴る,蹴る > 殴り,蹴る + * JVERB_TO: 殴る,蹴る > 殴って蹴る + * JVERB_OR: 殴る,蹴る > 殴ったり蹴ったり */ +static const struct jverb_table_t { + const char* from; + const char* to[3]; +} jverb_table[] = { + { "する", {"し", "して", "した"}}, + { "いる", {"いて", "いて", "いた"}}, + + { "える", {"え", "えて", "えた"}}, + { "ける", {"け", "けて", "けた"}}, + { "げる", {"げ", "えて", "げた"}}, + { "せる", {"せ", "せて", "せた"}}, + { "ぜる", {"ぜ", "ぜて", "ぜた"}}, + { "てる", {"て", "てって", "てった"}}, + { "でる", {"で", "でて", "でた"}}, + { "ねる", {"ね", "ねて", "ねた"}}, + { "へる", {"へ", "へて", "へた"}}, + { "べる", {"べ", "べて", "べた"}}, + { "める", {"め", "めて", "めた"}}, + { "れる", {"れ", "れて", "れた"}}, + + { "う", {"い", "って", "った"}}, + { "く", {"き", "いて", "いた"}}, + { "ぐ", {"ぎ", "いで", "いだ"}}, + { "す", {"し", "して", "した"}}, + { "ず", {"じ", "じて", "じた"}}, + { "つ", {"ち", "って", "った"}}, + { "づ", {"ぢ", "って", "った"}}, + { "ぬ", {"に", "ねて", "ねた"}}, + { "ふ", {"ひ", "へて", "へた"}}, + { "ぶ", {"び", "んで", "んだ"}}, + { "む", {"み", "んで", "んだ"}}, + { "る", {"り", "って", "った"}}, + { NULL, {"そして", "ことにより", "ことや"}}, +}; + +/*! + * @brief jverb_table_tに従って動詞を活用する + * @param in 変換元文字列ポインタ + * @param out 変換先文字列ポインタ + * @param flag 変換種類を指定(JVERB_AND/JVERB_TO/JVERB_OR) + * @return なし + * @details + */ +void jverb(concptr in, char *out, int flag) +{ + const struct jverb_table_t * p; + int in_len = strlen(in); + strcpy(out, in); -/* - * Convert SJIS string to EUC string + for (p = jverb_table; p->from; p++) { + int from_len = strlen(p->from); + if (strncmp(&in[in_len-from_len], p->from, from_len) == 0) { + strcpy(&out[in_len - from_len], p->to[flag - 1]); + break; + } + } + + if (p->from == NULL) + strcpy(&out[in_len], p->to[flag - 1]); +} + +/*! + * @brief 文字コードをSJISからEUCに変換する / Convert SJIS string to EUC string + * @param str 変換する文字列のポインタ + * @return なし + * @details */ void sjis2euc(char *str) { @@ -268,8 +226,11 @@ void sjis2euc(char *str) } -/* - * Convert EUC string to SJIS string +/*! + * @brief 文字コードをEUCからSJISに変換する / Convert EUC string to SJIS string + * @param str 変換する文字列のポインタ + * @return なし + * @details */ void euc2sjis(char *str) { @@ -312,14 +273,14 @@ void euc2sjis(char *str) } -/* - * str¤ò´Ä¶­¤Ë¹ç¤Ã¤¿Ê¸»ú¥³¡¼¥É¤ËÊÑ´¹¤·¡¢ÊÑ´¹Á°¤Îʸ»ú¥³¡¼¥É¤òÊÖ¤¹¡£ - * str¤ÎŤµ¤ËÀ©¸Â¤Ï¤Ê¤¤¡£ - * - * 0: Unknown - * 1: ASCII (Never known to be ASCII in this function.) - * 2: EUC - * 3: SJIS +/*! + * @brief strを環境に合った文字コードに変換し、変換前の文字コードを返す。strの長さに制限はない。 + * @param str 変換する文字列のポインタ + * @return + * 0: Unknown
+ * 1: ASCII (Never known to be ASCII in this function.)
+ * 2: EUC
+ * 3: SJIS
*/ byte codeconv(char *str) { @@ -403,8 +364,13 @@ byte codeconv(char *str) return code; } -/* ʸ»úÎós¤Îx¥Ð¥¤¥ÈÌܤ¬´Á»ú¤Î1¥Ð¥¤¥ÈÌܤ«¤É¤¦¤«È½Äꤹ¤ë */ -bool iskanji2(cptr s, int x) +/*! + * @brief 文字列sのxバイト目が漢字の1バイト目かどうか判定する + * @param s 判定する文字列のポインタ + * @param x 判定する位置(バイト) + * @return 漢字の1バイト目ならばTRUE + */ +bool iskanji2(concptr s, int x) { int i; @@ -417,5 +383,156 @@ bool iskanji2(cptr s, int x) return FALSE; } -#endif /* JP */ +/*! + * @brief 文字列の文字コードがASCIIかどうかを判定する + * @param str 判定する文字列へのポインタ + * @return 文字列の文字コードがASCIIならTRUE、そうでなければFALSE + */ +static bool is_ascii_str(concptr str) +{ + for (;*str; str++) { + if (!(0x00 < *str && *str <= 0x7f)) + return FALSE; + } + return TRUE; +} + +/*! + * @brief 文字列の文字コードがUTF-8かどうかを判定する + * @param str 判定する文字列へのポインタ + * @return 文字列の文字コードがUTF-8ならTRUE、そうでなければFALSE + */ +static bool is_utf8_str(concptr str) +{ + const unsigned char* p; + for (p = (const unsigned char*)str; *p; p++) { + int subseq_num = 0; + if (0x00 < *p && *p <= 0x7f) continue; + + if ((*p & 0xe0) == 0xc0) subseq_num = 1; + if ((*p & 0xf0) == 0xe0) subseq_num = 2; + if ((*p & 0xf8) == 0xf0) subseq_num = 3; + + if (subseq_num == 0) return FALSE; + while (subseq_num--) { + p++; + if (!*p || (*p & 0xc0) != 0x80) return FALSE; + } + } + return TRUE; +} + +#if defined(EUC) +#include + +static const struct ms_to_jis_unicode_conv_t { + char from[3]; + char to[3]; +} ms_to_jis_unicode_conv[] = { + {{0xef, 0xbd, 0x9e}, {0xe3, 0x80, 0x9c}}, /* FULLWIDTH TILDE -> WAVE DASH */ + {{0xef, 0xbc, 0x8d}, {0xe2, 0x88, 0x92}}, /* FULLWIDTH HYPHEN-MINUS -> MINUS SIGN */ +}; + +/*! + * @brief EUCがシステムコードである環境下向けにUTF-8から変換処理を行うサブルーチン + * @param str 変換する文字列のポインタ + * @return なし + */ +static void ms_to_jis_unicode(char* str) +{ + unsigned char* p; + for (p = (unsigned char*)str; *p; p++) { + int subseq_num = 0; + if (0x00 < *p && *p <= 0x7f) continue; + + if ((*p & 0xe0) == 0xc0) subseq_num = 1; + if ((*p & 0xf0) == 0xe0) { + int i; + for (i = 0; i < sizeof(ms_to_jis_unicode_conv) / sizeof(ms_to_jis_unicode_conv[0]); ++ i) { + const struct ms_to_jis_unicode_conv_t *c = &ms_to_jis_unicode_conv[i]; + if (memcmp(p, c->from, 3) == 0) { + memcpy(p, c->to, 3); + } + } + subseq_num = 2; + } + if ((*p & 0xf8) == 0xf0) subseq_num = 3; + + p += subseq_num; + } +} + +#elif defined(SJIS) && defined(WINDOWS) +#include +#endif +/*! + * @brief 文字コードがUTF-8の文字列をシステムの文字コードに変換する + * @param utf8_str 変換するUTF-8の文字列へのポインタ + * @param sys_str_buffer 変換したシステムの文字コードの文字列を格納するバッファへのポインタ + * @param sys_str_buflen 変換したシステムの文字コードの文字列を格納するバッファの長さ + * @return 変換に成功した場合TRUE、失敗した場合FALSEを返す + */ +static bool utf8_to_sys(char* utf8_str, char* sys_str_buffer, size_t sys_str_buflen) +{ +#if defined(EUC) + + iconv_t cd = iconv_open("EUC-JP", "UTF-8"); + size_t utf8_len = strlen(utf8_str) + 1; /* include termination character */ + char *from = utf8_str; + int ret; + + ms_to_jis_unicode(utf8_str); + ret = iconv(cd, &from, &utf8_len, &sys_str_buffer, &sys_str_buflen); + iconv_close(cd); + return (ret >= 0); + +#elif defined(SJIS) && defined(WINDOWS) + + LPWSTR utf16buf; + int input_len = strlen(utf8_str) + 1; /* include termination character */ + + C_MAKE(utf16buf, input_len, WCHAR); + /* UTF-8 -> UTF-16 */ + if (MultiByteToWideChar( CP_UTF8, 0, utf8_str, input_len, utf16buf, input_len) == 0) { + C_KILL(utf16buf, input_len, WCHAR); + return FALSE; + } + + /* UTF-8 -> SJIS(CP932) */ + if (WideCharToMultiByte( CP_ACP, 0, utf16buf, -1, sys_str_buffer, sys_str_buflen, NULL, NULL ) == 0) { + C_KILL(utf16buf, input_len, WCHAR); + return FALSE; + } + + C_KILL(utf16buf, input_len, WCHAR); + return TRUE; + +#endif +} + +/*! + * @brief 受け取った文字列の文字コードを推定し、システムの文字コードへ変換する + * @param strbuf 変換する文字列を格納したバッファへのポインタ。 + * バッファは変換した文字列で上書きされる。 + * UTF-8からSJISもしくはEUCへの変換を想定しているのでバッファの長さが足りなくなることはない。 + * @param buflen バッファの長さ。 + * @return なし + */ +void guess_convert_to_system_encoding(char* strbuf, int buflen) +{ + if (is_ascii_str(strbuf)) return; + + if (is_utf8_str(strbuf)) { + char* work; + C_MAKE(work, buflen, char); + my_strcpy(work, strbuf, buflen); + if (!utf8_to_sys(work, strbuf, buflen)) { + msg_print("警告:文字コードの変換に失敗しました"); + msg_print(NULL); + } + C_KILL(work, buflen, char); + } +} + +#endif /* JP */