3 # Rec10 TS Recording Tools
4 # Copyright (C) 2009 Yukikaze
7 def bigram(str1, str2):
8 str1 = zenhan.toHankaku(str1)
9 str2 = zenhan.toHankaku(str2)
10 str1 = str1.replace(" ", "")
11 str2 = str2.replace(" ", "")
25 i = find_gram(x, str2)
32 def trigram(str1, str2):
33 str1 = zenhan.toHankaku(str1)
34 str2 = zenhan.toHankaku(str2)
35 str1 = str1.replace(" ", "")
36 str2 = str2.replace(" ", "")
38 trigramによる単語の近さを計算します。
47 gram.append(tmp1 + tmp2 + x)
53 i = find_gram(x, str2)
60 point = point + 20*count*count
61 point = point / len(str1) * 10
62 point = point / len(str2) * 10
64 def find_gram(gram, s):
70 while st.find(gram) != -1:
72 st = st[st.find(gram) + 1:]
74 def get_noun_quad_gram(s):
75 str1 = zenhan.toHankaku(s)
77 trigramによる単語の近さを計算します。
85 tmps=tmp1 + tmp2 + tmp3 + x
86 if tmps.find(" ")==-1:
87 if (zenhan.check_Character_Type(tmp1)==zenhan.check_Character_Type(tmp2))and(zenhan.check_Character_Type(tmp2)==zenhan.check_Character_Type(tmp3))and(zenhan.check_Character_Type(tmp3)==zenhan.check_Character_Type(x)):
88 if gram.has_key(tmps):
89 gram[tmps]=gram[tmps]+1