File: import_google_userdict.py

package info (click to toggle)
sunpinyin 2.0.3%2Bgit20120607-1
  • links: PTS, VCS
  • area: main
  • in suites: wheezy
  • size: 1,372 kB
  • sloc: cpp: 14,549; python: 1,309; makefile: 154
file content (33 lines) | stat: -rwxr-xr-x 744 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
#!/usr/bin/python

import os, sys
import codecs
from importer import import_to_sunpinyin_user_dict

def load_google_user_dict(fname):
    """Parse an exported user dictionary file into (pinyin, word) pairs.

    The file is decoded as GB18030 and read line by line.  Each non-blank
    line is split on whitespace:

    * the first field is the word;
    * if the second field parses as an integer (presumably a frequency
      count), it is skipped;
    * every remaining field is a syllable; syllables are joined with "'".

    Blank lines are ignored.  A line holding only a word yields an empty
    pinyin string.

    Args:
        fname: path of the dictionary file to read.

    Returns:
        A list of ``(pystr, word)`` tuples, in file order.
    """
    result = []
    # `with` guarantees the file is closed even if decoding fails midway.
    with codecs.open(fname, "r", "GB18030") as f:
        for line in f:
            fields = line.split()
            if not fields:
                # Blank line: nothing to import.  Indexing fields[0] here
                # would raise IndexError and abort the whole load.
                continue

            word = fields[0]
            try:
                int(fields[1])
            except (IndexError, ValueError):
                # No second field, or it is not a number: everything after
                # the word is pinyin.
                syllables = fields[1:]
            else:
                # Second field is numeric; the pinyin starts after it.
                syllables = fields[2:]

            result.append(("'".join(syllables), word))

    return result

def main():
    """Command-line entry point.

    Expects exactly one argument: the path of the Google Pinyin exported
    user dictionary file.  The file is parsed with load_google_user_dict
    and the resulting entries are handed to import_to_sunpinyin_user_dict.

    With any other number of arguments, a usage message is written to
    stderr and the process exits with status 1.
    """
    if len(sys.argv) != 2:
        # Diagnostics belong on stderr.  sys.exit is used rather than the
        # bare `exit` builtin, which is only injected by the `site` module
        # and is not guaranteed to exist (e.g. under `python -S`).
        sys.stderr.write(
            "Please specify the Google Pinyin exported user dict file!\n")
        sys.exit(1)

    google_user_dict = load_google_user_dict(sys.argv[1])
    import_to_sunpinyin_user_dict(google_user_dict)

# Run the importer only when this file is executed as a script, not when it
# is imported as a module.
if __name__ == "__main__":
    main()