starting to write pinyinizer

master
Dario Ernst 14 years ago
parent e56b2b931e
commit f9685346ce

@ -0,0 +1,53 @@
import sqlite3
import sys
import os
import re
def pinyinize(slconn, hanzi):
    """Convert a hanzi string to pinyin using a dictionary database.

    The text is consumed left to right.  At each position the candidate
    word is grown one character at a time for as long as the candidate
    has a row in the ``entries`` table (looked up by its ``simplified``
    column); the ``pinyin`` of the longest candidate found is emitted.
    A word is therefore only reachable if each of its prefixes is also
    in the table.

    A character with no entry at all is copied to the output unchanged
    and consumed, so the scan always advances.

    Args:
        slconn: open sqlite3 connection providing an ``entries`` table
            with ``simplified`` and ``pinyin`` columns.
        hanzi: text to convert (unicode text, already decoded).

    Returns:
        The emitted pieces, each followed by a single space.
    """
    hzwork = list(hanzi)
    total = len(hzwork)
    finres = ""
    start = 0
    while start < total:
        print("\nhzwork still %s" % hzwork[start:])
        tmpstr = ""
        lastres = ""
        end = start
        # Scan by index instead of popping from the list being iterated:
        # popping while iterating ends the scan early and hides longer
        # dictionary words.
        while end < total:
            tmpstr += hzwork[end]
            print("checking for %s (%s)" % (tmpstr, repr(tmpstr)))
            # Bound parameter: input containing quote characters can
            # neither break nor alter the query.
            row = slconn.execute(
                "SELECT pinyin FROM entries WHERE simplified=?", (tmpstr,)
            ).fetchone()
            if row is None:
                print("got empty result, breaking")
                break
            lastres = row[0]
            end += 1
            print("found and consumed %s" % lastres)
        if end == start:
            # Not even the single character is known.  Pass it through
            # and step over it; otherwise the outer loop never ends.
            lastres = hzwork[start]
            end = start + 1
        finres += lastres + " "
        print("appending and deleting lastres %s, finres now: %s"
              % (lastres, finres))
        start = end
    return finres


def main(argv=None):
    """Command-line entry point.

    Args:
        argv: argument vector ``[program, hanzi-text-or-file, sqlite-file]``;
            defaults to ``sys.argv``.

    Returns:
        Process exit status: 0 on success, 1 on a usage error or when the
        database file does not exist.
    """
    if argv is None:
        argv = sys.argv
    if len(argv) != 3:
        # NOTE(review): the usage text names "cedict2sqlite"; confirm the
        # intended script name.
        print("Usage: cedict2sqlite [hanzi-text or file] [sqlite-file.sqlite]")
        # The original had a bare `exit`, which is never called, so the
        # script carried on with bad arguments.
        return 1
    hanzitf = argv[1]
    sqlitef = argv[2]

    if os.path.isfile(hanzitf):
        # Read raw bytes and close the handle deterministically.
        with open(hanzitf, "rb") as handle:
            hanzi = handle.read()
    else:
        hanzi = hanzitf
    # File contents (and Python 2 command-line arguments) are byte strings;
    # decode once at the boundary and work in text from here on.
    if isinstance(hanzi, bytes):
        hanzi = hanzi.decode("UTF-8")
    # str methods return new objects; the result has to be kept.
    hanzi = hanzi.strip().lower()

    if not os.path.exists(sqlitef):
        print("sqlite database file not found")
        return 1

    slconn = sqlite3.connect(sqlitef)
    try:
        finres = pinyinize(slconn, hanzi)
    finally:
        slconn.close()
    print("\nfinished with: %s\n" % finres)
    return 0


if __name__ == "__main__":
    sys.exit(main())
Loading…
Cancel
Save