ti34973 fixed (nvdajp ticket 34973: handling of parenthesized day-of-week kanji such as （日）)

author Takuya Nishimoto <nishimotz@gmail.com>

Thu, 12 Mar 2015 14:00:08 +0000 (23:00 +0900)

committer Takuya Nishimoto <nishimotz@gmail.com>

Thu, 12 Mar 2015 14:00:08 +0000 (23:00 +0900)
author Takuya Nishimoto <nishimotz@gmail.com>
Thu, 12 Mar 2015 14:00:08 +0000 (23:00 +0900)
committer Takuya Nishimoto <nishimotz@gmail.com>
Thu, 12 Mar 2015 14:00:08 +0000 (23:00 +0900)
diff --git a/include/jtalk/custom_dic_maker.py b/include/jtalk/custom_dic_maker.py

index 02bd995..cb2104d 100644 (file)
--- a/include/jtalk/custom_dic_maker.py
+++ b/include/jtalk/custom_dic_maker.py
@@ -307,7 +307,42 @@ jdic = [
          'speech':'トーキング',\r
          'accent':'1/5',\r
          },\r
-\r
+       {'text':'（日）',\r
+        'speech':'（ニチ）',\r
+        'braille':'（ニチ）',\r
+        'accent':"1/2",\r
+        'cost':1345,\r
+        'pos':"名詞,一般,*,*,*,*"\r
+        },\r
+       {'text':'（月）',\r
+        'speech':'（ゲツ）',\r
+        'braille':'（ゲツ）',\r
+        'accent':"1/2",\r
+        'cost':1345,\r
+        'pos':"名詞,一般,*,*,*,*"\r
+        },\r
+       {'text':'（火）',\r
+        'speech':'（カ）',\r
+        'braille':'（カ）',\r
+        'accent':"1/1",\r
+        'cost':1345,\r
+        'pos':"名詞,一般,*,*,*,*"\r
+        },\r
+       {'text':'（水）',\r
+        'speech':'（スイ）',\r
+        'braille':'（スイ）',\r
+        'accent':"1/2",\r
+        'cost':1345,\r
+        'pos':"名詞,一般,*,*,*,*"\r
+        },\r
+       {'text':'（木）',\r
+        'speech':'（モク）',\r
+        'braille':'（モク）',\r
+        'accent':"1/2",\r
+        'cost':1345,\r
+        'pos':"名詞,一般,*,*,*,*"\r
+        },\r
+       \r
  #      ['きゃ', 'キャ',            "1/1",          15000,          "記号,一般,*,*,*,*"],\r
  #      ['きゅ', 'キュ',            "1/1",          15000,          "記号,一般,*,*,*,*"],\r
  #      ['きょ', 'キョ',            "1/1",          15000,          "記号,一般,*,*,*,*"],\r
diff --git a/jptools/harness.py b/jptools/harness.py

index d112f83..c6fb28b 100644 (file)
--- a/jptools/harness.py
+++ b/jptools/harness.py
@@ -178,9 +178,43 @@ tests = [
                 'text': '(日)',\r
                 'input': '(ニチ)',\r
                 'output': '⠶⠇⠗⠶',\r
-               'inpos2': [0,1,2],\r
+               'inpos2': [0,1,1,2],\r
                 'inpos1': [0,1,2,3],\r
-               'inpos':  [0,1,1,1,2],\r
+               'inpos':  [0,1,1,2],\r
+               'comment': 'nvdajp ticket34973',\r
+       },\r
+       {\r
+               'text': '(月)',\r
+               'input': '(ゲツ)',\r
+               'comment': 'nvdajp ticket34973',\r
+       },\r
+       {\r
+               'text': '(火)',\r
+               'input': '(カ)',\r
+               'output': '⠶⠡⠶',\r
+               'inpos2': [0,1,2],\r
+               'inpos1': [0,1,2],\r
+               'inpos':  [0,1,2],\r
+               'comment': 'nvdajp ticket34973',\r
+       },\r
+       {\r
+               'text': '(水)',\r
+               'input': '(スイ)',\r
+               'comment': 'nvdajp ticket34973',\r
+       },\r
+       {\r
+               'text': '(木)',\r
+               'input': '(モク)',\r
+               'comment': 'nvdajp ticket34973',\r
+       },\r
+       {\r
+               'text': '(金)',\r
+               'input': '(キン)',\r
+               'comment': 'nvdajp ticket34973',\r
+       },\r
+       {\r
+               'text': '(土)',\r
+               'input': '(ド)',\r
                 'comment': 'nvdajp ticket34973',\r
         },\r
         {\r
diff --git a/source/synthDrivers/jtalk/translator2.py b/source/synthDrivers/jtalk/translator2.py

index 96d752c..d02f14a 100644 (file)
--- a/source/synthDrivers/jtalk/translator2.py
+++ b/source/synthDrivers/jtalk/translator2.py
@@ -79,6 +79,31 @@ CONNECTED_MORPHS = {
                 ['なく', 'ナク', '2/2', None, None, None],\r
                 ['なる', 'ナル', '1/2', '動詞', '自立', None],\r
                 ],\r
+       '（日）': [\r
+               ['（', '(', '*/*', '記号', '括弧開', '*'],\r
+               ['日', 'ニチ', '1/2', '名詞', '一般', None],\r
+               ['）', ')', '*/*', '記号', '括弧閉', '*'],\r
+               ],\r
+       '（月）': [\r
+               ['（', '(', '*/*', '記号', '括弧開', '*'],\r
+               ['月', 'ゲツ', '1/2', '名詞', '一般', None],\r
+               ['）', ')', '*/*', '記号', '括弧閉', '*'],\r
+               ],\r
+       '（火）': [\r
+               ['（', '(', '*/*', '記号', '括弧開', '*'],\r
+               ['火', 'カ', '1/1', '名詞', '一般', None],\r
+               ['）', ')', '*/*', '記号', '括弧閉', '*'],\r
+               ],\r
+       '（水）': [\r
+               ['（', '(', '*/*', '記号', '括弧開', '*'],\r
+               ['水', 'スイ', '1/2', '名詞', '一般', None],\r
+               ['）', ')', '*/*', '記号', '括弧閉', '*'],\r
+               ],\r
+       '（木）': [\r
+               ['（', '(', '*/*', '記号', '括弧開', '*'],\r
+               ['木', 'モク', '1/2', '名詞', '一般', None],\r
+               ['）', ')', '*/*', '記号', '括弧閉', '*'],\r
+               ],\r
  }\r
  \r
  class MecabMorph(object):\r
@@ -166,12 +191,12 @@ def mecab_to_morphs(mf):
                         if len(ar) > 7:\r
                                 mo.kihon = ar[7]\r
                         if len(ar) > 9:\r
-                               mo.kana = ar[8]\r
-                               mo.yomi = ar[9]\r
+                               mo.kana = unicode_normalize(ar[8]) # "（ニチ）" -> "(ニチ)"\r
+                               mo.yomi = unicode_normalize(ar[9])\r
                                 mo.accent = ar[10]\r
                                 if len(ar) > 12:\r
                                         # Mecab辞書の拡張フィールドの点訳表記があれば使用する\r
-                                       mo.output = ar[12]\r
+                                       mo.output = unicode_normalize(ar[12])\r
                                 else:\r
                                         mo.output = ar[9]\r
                                         update_phonetic_symbols(mo)\r
@@ -186,11 +211,13 @@ def replace_morphs(li, dic):
                         new_morphs = dic[mo.hyouki]\r
                         for i in new_morphs:\r
                                 m = copy.deepcopy(mo)\r
-                               m.hyouki = m.nhyouki = i[0] # に\r
+                               m.hyouki = i[0] # に\r
+                               m.nhyouki = unicode_normalize(i[0]) # に\r
                                 if i[3]: m.hinshi1 = i[3]\r
                                 if i[4]: m.hinshi2 = i[4]\r
                                 if i[5]: m.hinshi3 = i[5]\r
-                               m.output = m.kana = m.yomi = i[1] # ニ\r
+                               m.kana = i[0]\r
+                               m.output = m.yomi = unicode_normalize(i[1]) # ニ\r
                                 m.accent = i[2] # 0/1\r
                                 new_li.append(m)\r
                 else:\r
author	Takuya Nishimoto <nishimotz@gmail.com>
	Thu, 12 Mar 2015 14:00:08 +0000 (23:00 +0900)
committer	Takuya Nishimoto <nishimotz@gmail.com>
	Thu, 12 Mar 2015 14:00:08 +0000 (23:00 +0900)
include/jtalk/custom_dic_maker.py		patch \| blob \| history
jptools/harness.py		patch \| blob \| history
source/synthDrivers/jtalk/translator2.py		patch \| blob \| history