OSDN Git Service

Implement series-number determination (detSeriesNum).
[rec10/rec10-git.git] / rec10 / trunk / src / guess.py
index 6416bd3..5e1f6ca 100644 (file)
@@ -1,7 +1,8 @@
 #!/usr/bin/python
 # coding: UTF-8
 # Rec10 TS Recording Tools
-# Copyright (C) 2009 Yukikaze
+# Copyright (C) 2009-2010 Yukikaze
 
 import os
+import os.path
 import re
@@ -9,35 +10,49 @@ import time
 import os
 import datetime
 import n_gram
+import recdblist
 import zenhan
+import auto_move
 
 def detName(title,path):
     tt=detNameType(title, path)
     if tt['type']=="C"or tt['type']=="D":
         tt['num']=detNum(tt['title'],tt['folder'])
+def detSeriesNum(execpath):
+    files=os.listdir(execpath)
+    ss={}
+    for file in files:
+        ftitle=os.path.splitext(file)
+        fname=ftitle[0]
+        fname=zenhan.toHankaku(unicode(name))
+        st=detNameType(fname, execpath)['title']
+        if not len(ss[st])>0:
+            ss[st]=[]
+        ss[detNum(fname,execpath)]=ftitle
+    return ss
 def detNum(title,movepath):
     """
-        #
+        #Guess the episode number of the program.
+        Lists movepath and, for every regular file, runs detNameType on the
+        extension-less, zenhan.toHankaku-normalized file name. Files whose
+        'num' is not -1 are collected as [num, title, mtime-as-datetime] and
+        the list is handed to detMultiDeltaDays, whose result is returned.
+        The title argument is not referenced in this body.
     """
     files=os.listdir(movepath)
     ff=[]
     maxnum=0
     for file in files:
-        print file
+        recdblist.printutf8(file)
         file=os.path.join(movepath,file)
         if os.path.isfile(file):
             name=os.path.splitext(os.path.split(file)[1])
             name=name[0]
             name=zenhan.toHankaku(unicode(name))
             p1=detNameType(name,movepath)
-            print p1['title']+" "+str(p1['num'])
+            recdblist.printutf8(p1['title']+" "+str(p1['num']))
+            #this localtime value is overwritten by the datetime on the next line
             time1=time.localtime(os.path.getmtime(file))
             time1=datetime.datetime.fromtimestamp(os.path.getmtime(file))
             if p1['num']!=-1:
                 ff.append([p1['num'],p1['title'],time1])
+                #maxnum is tracked here but not read again in this function
                 if maxnum<p1['num']+1:
                     maxnum=p1['num']+1
-    detMultiDeltaDays(ff)
+    return detMultiDeltaDays(ff)
 def detMultiDeltaDays(num_with_title_with_dates):
     maxnum=0
     for ft in num_with_title_with_dates:
@@ -55,13 +70,13 @@ def detMultiDeltaDays(num_with_title_with_dates):
             for ft3 in f3[i]:
                 for ft4 in f3[j]:
                     for gdd in detSingleDeltaDay(i, ft3[2], j, ft4[2]):
-                        print gdd
+                        #print gdd
                         if fret.get(gdd[0])!=None:
-                            print fret
+                            #print fret
                             fret[gdd[0]]=fret[gdd[0]]+gdd[1]
                         else:
                             fret[gdd[0]]=gdd[1]
-    print fret
+    #print fret
     maxk=0
     maxp=0
     for i in range(maxnum):
@@ -69,8 +84,8 @@ def detMultiDeltaDays(num_with_title_with_dates):
             if maxp<fret[i]:
                 maxk=i
                 maxp=fret[i]
-    print maxk
-    print maxp
+    #print maxk
+    #print maxp
     return maxk
 def detSingleDeltaDay(num1,date1,num2,date2):
     dd=date1-date2
@@ -91,7 +106,7 @@ def detSingleDeltaDay(num1,date1,num2,date2):
         dm=dm+d
     if dp%d*2>d:
         dp=dp+d
-    print str(d)+":"+str(dn)
+    recdblist.printutf8(str(d)+":"+str(dn))
     if dp!=dn:
         ret.append([dn/d,60])
         ret.append([dp/d,40])
@@ -110,7 +125,8 @@ def detNameType(title,path):
     type Aj ---title第<number>話
     path --search reflexively
     """
-    print title
+    recdblist.printutf8(title)
+    title=auto_move.getTitle(title)##titleから日時を除く
     #rA=re.compile(".+(?P<title>)#\d(?P<num>)\s[0,10]\z")
     rA=re.compile("(.+)#(\d*)\s*\Z")
     tA=rA.match(title)
@@ -120,26 +136,26 @@ def detNameType(title,path):
     tAj=rAj.match(title)
     ret={'title':"",'type':"",'num':0,'subtitle':"",'folder':""}
     if tA:
-        print "typeA"
-        print "title="+tA.group(1)
-        print "num="+tA.group(2)
+        recdblist.printutf8("typeA")
+        recdblist.printutf8("title="+tA.group(1))
+        recdblist.printutf8("num="+tA.group(2))
         ret['type']="A"
         ret['title']=tA.group(1)
         ret['num']=int(tA.group(2))
         ret['folder']=searchFolder(tA.group(1),path)
     if tAj:
-        print "typeA"
-        print "title="+tAj.group(1)
-        print "num="+tAj.group(2)
+        recdblist.printutf8("typeA")
+        recdblist.printutf8("title="+tAj.group(1))
+        recdblist.printutf8("num="+tAj.group(2))
         ret['type']="Aj"
         ret['title']=tAj.group(1)
         ret['num']=int(tAj.group(2))
         ret['folder']=searchFolder(tAj.group(1),path)
     elif tB:
-        print "typeB"
-        print "title="+tB.group(1)
-        print "num="+tB.group(2)
-        print "subtitle="+tB.group(3)
+        recdblist.printutf8("typeB")
+        recdblist.printutf8("title="+tB.group(1))
+        recdblist.printutf8("num="+tB.group(2))
+        recdblist.printutf8("subtitle="+tB.group(3))
         ret['type']="B"
         ret['title']=tB.group(1)
         ret['num']=int(tB.group(2))
@@ -153,18 +169,18 @@ def detNameType(title,path):
         for t in ts:
             tt=tt+" "+t
             ft1=searchFolder(tt,path)
-            print tt
-            print ft1
+            recdblist.printutf8(tt)
+            #print ft1
             if ft1!="":
-                #print rt
-                #print ft1[0]+" : "+str(ft1[1])
+                #recdblist.printutf8(rt)
+                #recdblist.printutf8(ft1[0]+" : "+str(ft1[1]))
                 if ft1[1]>rt[1]:
                     rt[0]=tt
                     rt[1]=ft1[1]
                     rt[2]=ft1[0]
-                    #print rt
-        #print "title="+rt[0][1:]+"/"
-        #print "subtitle = "+title.replace(rt[0][1:],"")[1:]
+                    #recdblist.printutf8(rt)
+        #recdblist.printutf8("title="+rt[0][1:]+"/")
+        #recdblist.printutf8("subtitle = "+title.replace(rt[0][1:],"")[1:])
         ret['title']=rt[0][1:]
         ret['num']=-1
         ret['folder']=rt[2]
@@ -174,7 +190,7 @@ def detNameType(title,path):
         else:
             ret['type']="C"
     return ret
-def searchFolder(title,path):
+def searchFolder(title,path,threshold=500):
     """
     titleからフォルダーを探す
     """
@@ -200,16 +216,18 @@ def searchFolder(title,path):
         else:
             cmpp=os.path.basename(dirp)
             appp=os.path.dirname(dirp)
-        p=n_gram.trigram(title.decode("utf-8"),cmpp.decode("utf-8"))
+        ntitle=auto_move.getTitle(title)
+        ncmpp=auto_move.getTitle(cmpp)
+        p=n_gram.trigram(ntitle,ncmpp)
         if p>0:
             ngram.append((p,appp))
     ngram=list(set(ngram))
     ngram.sort()
     ngram.reverse()
     if len(ngram)>0:
-        #print title + ngram[0][1] + " : "+str(ngram[0][0])
-        if ngram[0][0]>300:
-            return [ngram[0][1],ngram[0][0]]
+        #recdblist.printutf8(title + ngram[0][1] + " : "+str(ngram[0][0]))
+        if ngram[0][0]>threshold:
+            return ngram[0][1]
         else:
             return ""
     else: