From aed5a2f2fcc5530d216915544b592f5ec0748a3c Mon Sep 17 00:00:00 2001 From: evgeny Date: Fri, 23 Sep 2011 01:00:51 +0400 Subject: [PATCH] modified src/strokes.txt --- data/all.sh | 9 +++++++++ data/convert.py | 4 ++-- data/merge.py | 1 + data/merge.sh | 2 +- data/sort.sh | 2 +- data/strokes.txt.bak | Bin 78576 -> 78608 bytes src/strokes.txt | Bin 259968 -> 259968 bytes 7 files changed, 14 insertions(+), 4 deletions(-) create mode 100755 data/all.sh mode change 100755 => 100644 data/strokes.txt.bak diff --git a/data/all.sh b/data/all.sh new file mode 100755 index 0000000..8befdc5 --- /dev/null +++ b/data/all.sh @@ -0,0 +1,9 @@ +#!/usr/bin/env sh + +./convert.py handwriting-ja.xml +./sort.sh tomoe.utf16 +./sort.sh strokes.txt.bak +./merge.sh strokes.txt.bak.sorted tomoe.utf16.sorted +rm *sorted *utf16 +./sort.sh output.txt +mv output.txt.sorted output.txt diff --git a/data/convert.py b/data/convert.py index 74872a7..b34ca8e 100755 --- a/data/convert.py +++ b/data/convert.py @@ -6,7 +6,7 @@ import codecs from math import acos, pi if len(sys.argv) < 2: - print("Usage: %s" % sys.argv[0]) + print("Usage: %s handwriting-ja.xml" % sys.argv[0]) sys.exit(1) class pt: @@ -51,7 +51,7 @@ def get_chr(pts, cap = False): return ret f = open(sys.argv[1]) -fo = open("tomoe", 'wb') +fo = open("tomoe.utf16", 'wb') fo.write(codecs.BOM_UTF16_LE) k = None pts = [] diff --git a/data/merge.py b/data/merge.py index 5367b9e..b9a114e 100755 --- a/data/merge.py +++ b/data/merge.py @@ -61,3 +61,4 @@ fo = open("merged.txt.utf8", 'w') for i in l1: fo.write(i) fo.close() + diff --git a/data/merge.sh b/data/merge.sh index 80d0fa0..6e7a0e4 100755 --- a/data/merge.sh +++ b/data/merge.sh @@ -6,5 +6,5 @@ iconv -f UTF16LE -t UTF8 $2 > $2.utf8 shopt -s xpg_echo echo '\x0A\x0A\c' >> merged.txt.utf8 crlf -d merged.txt.utf8 -(echo '\xFF\xFE\c' & iconv -f UTF8 -t UTF16LE merged.txt.utf8) > merged.txt +(echo '\xFF\xFE\c' & iconv -f UTF8 -t UTF16LE merged.txt.utf8) > output.txt rm *.utf8 diff --git a/data/sort.sh b/data/sort.sh index 5f5d913..81557b5 100755 --- a/data/sort.sh +++ b/data/sort.sh @@ -5,5 +5,5 @@ iconv -f UTF16LE -t UTF8 $1 > $1.utf8 shopt -s xpg_echo echo '\x0A\x0A\c' >> $1.utf8_sorted crlf -d $1.utf8_sorted -(echo '\xFF\xFE\c' & iconv -f UTF8 -t UTF16LE $1.utf8_sorted) > out.txt +(echo '\xFF\xFE\c' & iconv -f UTF8 -t UTF16LE $1.utf8_sorted) > $1.sorted rm *.utf8 *_sorted diff --git a/data/strokes.txt.bak b/data/strokes.txt.bak old mode 100755 new mode 100644 index ec276082e2ec94277595c3b73d6ac9b49d91ff99..137f62afe41e585242d93c6bc63a935035373032 GIT binary patch delta 30 mcmezHlx4y*mJK@^xIgDQGdMGNGB`1~O}_X-c=NUft4#pY!woV3 delta 14 WcmbR6jOD{qmJK@^Hs5Hl*aQGRI|wlV diff --git a/src/strokes.txt b/src/strokes.txt index 9abea7c3ba938dc29ef980cd0b65e72256463a67..d2bd1c632838d29a65137edac35c5870d23b8b2d 100644 GIT binary patch delta 50 zcmZp8&)@K#e}fkDW*z3ff9#)gof(`NJg3_yGl_5C!N?fF+-|_i2*ga=4Op22J~2r# F007EV4`cuU delta 47 zcmZp8&)@K#e}fh?W8!8_=Kg=%Z!j{3F|&Tob!KpzzL$|vx?PWz5r~<#>#;Hid;$QV CGY^*l -- 2.11.0