#!/usr/bin/python
# coding: UTF-8
# Rec10 TS Recording Tools
-# Copyright (C) 2009 Yukikaze
+# Copyright (C) 2009-2010 Yukikaze
+import recdblist
# Conversion tables used by toHankaku() and toHankaku_ABC123().
#
# Every z_* string lists the characters to be replaced and the h_* string of
# the same name lists the half-width replacements: the character at index i
# of a z_* table is converted to the character at index i of its h_* partner.
# Each pair must therefore keep the same length and ordering.

# Printable ASCII (U+0021-U+007E) has a full-width twin exactly 0xFEE0 code
# points higher (U+FF01-U+FF5E); IDEOGRAPHIC SPACE U+3000 is the twin of the
# plain space. unicode.translate() leaves characters missing from this map
# untouched, so non-ASCII entries written explicitly below pass through as-is.
_FULLWIDTH_OF = dict((code, code + 0xFEE0) for code in range(0x21, 0x7F))
_FULLWIDTH_OF[0x20] = 0x3000

h_ascii = (
    u"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz"
    u" !\"#$%&'()*+,-./:;<=>?@[\\]^_`{|}~ -"
)
# Laid out position-for-position like h_ascii.  Six punctuation slots use the
# variants the table already carried instead of the U+FFxx form: U+201D for
# '"', U+2019 for "'", U+2212 for '-', U+00A5 for '\\', U+2018 for '`' and
# U+301C for '~'.  Everything typed as ASCII here is lifted to its full-width
# twin by translate().
# NOTE(review): the letters, digits and remaining punctuation previously
# compared equal to their h_* partners, which made the conversion a no-op for
# them; the full-width forms are restored on the assumption that they were
# lost in an encoding/normalisation step -- confirm against the repository.
# NOTE(review): the last pair (second U+301C -> '-') can never be selected,
# because lookups use find(), which returns the first U+301C (-> '~').  It is
# kept so both tables stay aligned; confirm which dash was intended.
z_ascii = (
    u"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz"
    u" !\u201d#$%&\u2019()*+,\u2212./:;<=>?@[\u00a5]^_\u2018{|}\u301c \u301c"
).translate(_FULLWIDTH_OF)

# Extra pairs applied after the main table: MINUS SIGN (U+2212) -> '-' and
# FULLWIDTH FULL STOP (U+FF0E) -> '.'.
z_ascii_sp = u"\u2212\uff0e"
h_ascii_sp = u"-."

h_number = u"0123456789"
z_number = h_number.translate(_FULLWIDTH_OF)

h_alphabet = u"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz #"
z_alphabet = h_alphabet.translate(_FULLWIDTH_OF)
def toHankaku(str):
    """Return a copy of *str* with table characters replaced by half-width ones.

    Each character is run through three module-level table pairs in order:
    ``z_ascii``/``h_ascii``, ``z_ascii_sp``/``h_ascii_sp`` and
    ``z_number``/``h_number``.  When the character occurs in a ``z_*`` table
    it is replaced by the character at the same index of the paired ``h_*``
    table, and that replacement is what the next pair is checked against.
    Characters found in none of the tables are copied unchanged.

    The parameter keeps its original name ``str`` (which shadows the builtin
    inside this function) so that keyword callers continue to work.

    Returns a unicode string; an empty input yields ``u""``.
    """
    table_pairs = (
        (z_ascii, h_ascii),
        (z_ascii_sp, h_ascii_sp),
        (z_number, h_number),
    )
    converted = []
    for ch in str:
        for zenkaku, hankaku in table_pairs:
            # find() reports the first occurrence, so when a table lists a
            # character twice only its first pairing is ever used.
            idx = zenkaku.find(ch)
            if idx != -1:
                ch = hankaku[idx]
        converted.append(ch)
    # Join once instead of growing the result string on every character.
    return u"".join(converted)
def toHankaku_ABC123(str):
    """Return a copy of *str* with letters, digits and a few symbols converted.

    Works like a narrower ``toHankaku``: each character is run through the
    module-level table pairs ``z_alphabet``/``h_alphabet``,
    ``z_ascii_sp``/``h_ascii_sp`` and ``z_number``/``h_number``, in that
    order.  A character found in a ``z_*`` table is replaced by the character
    at the same index of the paired ``h_*`` table, and the replacement is
    what the next pair is checked against.  Any other character (including
    punctuation that only the larger ``z_ascii`` table lists) is copied
    unchanged.

    The parameter keeps its original name ``str`` (which shadows the builtin
    inside this function) so that keyword callers continue to work.

    Returns a unicode string; an empty input yields ``u""``.
    """
    table_pairs = (
        (z_alphabet, h_alphabet),
        (z_ascii_sp, h_ascii_sp),
        (z_number, h_number),
    )
    converted = []
    for ch in str:
        for zenkaku, hankaku in table_pairs:
            idx = zenkaku.find(ch)
            if idx != -1:
                ch = hankaku[idx]
        converted.append(ch)
    # Join once instead of growing the result string on every character.
    return u"".join(converted)
-
def check_Character_Type(character):
    """Classify one character by the range its code point falls in.

    ``character`` must be a single-character string, because it is handed
    straight to ``ord()`` (which raises ``TypeError`` for anything else).

    Return codes:
        1 -- U+0000..U+007F.  Labelled "Alphabet" by the original author, but
             the range is all of ASCII, so digits, punctuation and control
             characters are reported as 1 as well.
        2 -- U+3040..U+309F (Hiragana)
        3 -- U+30A0..U+30FF (Katakana)
        4 -- U+4E00..U+9FFF (Kanji)
        None -- any code point outside the ranges above.
    """
    chcode = ord(character)
    if 0x0000 <= chcode <= 0x007F:
        return 1
    if 0x3040 <= chcode <= 0x309F:
        return 2
    if 0x30A0 <= chcode <= 0x30FF:
        return 3
    if 0x4E00 <= chcode <= 0x9FFF:
        return 4
    # Unclassified characters have always fallen through to None; callers may
    # depend on that, so it is spelled out rather than changed.
    return None