diff options
author | Peng Wu <alexepico@gmail.com> | 2013-02-01 10:54:38 +0800 |
---|---|---|
committer | Peng Wu <alexepico@gmail.com> | 2013-02-01 10:54:38 +0800 |
commit | df43ebb8360fa5fafe801e01e7f2f6195d2b137a (patch) | |
tree | ab54df6f741822ee31615ca13293bab361ddb2b5 | |
parent | aa75fc05cced38be5bee6d4b8cc572859d3761c8 (diff) | |
download | trainer-df43ebb8360fa5fafe801e01e7f2f6195d2b137a.tar.gz trainer-df43ebb8360fa5fafe801e01e7f2f6195d2b137a.tar.xz trainer-df43ebb8360fa5fafe801e01e7f2f6195d2b137a.zip |
fixes bugs
-rw-r--r-- | tools/merge.py | 8 |
1 file changed, 4 insertions, 4 deletions
```diff
diff --git a/tools/merge.py b/tools/merge.py
index c018bfe..cc90dc2 100644
--- a/tools/merge.py
+++ b/tools/merge.py
@@ -12,7 +12,7 @@ default = 100
 
 words_dict = {}
 
-def load_recognized_word(filename):
+def load_recognized_words(filename):
     print(filename)
 
     words = set([])
@@ -80,7 +80,7 @@ def filter_recognized_words(filename):
 
 def save_merged_words(filename):
     print(filename)
-    wordfile = open(filename, "r")
+    wordfile = open(filename, "w")
     for word, pairs in merged_words_dict.items():
         pinyins = {}
         for pinyin, freq in pairs:
@@ -91,7 +91,7 @@ def save_merged_words(filename):
 
         freqsum = sum([ freq for pinyin, freq in pinyins.items() ])
 
-        for pinyin, freq in pairs.items():
+        for pinyin, freq in pinyins.items():
             freq = int(default * freq / freqsum)
 
             if freq < minimum:
@@ -99,7 +99,7 @@ def save_merged_words(filename):
 
             freq = str(freq)
 
-            oneline = '\t'.join(word, pinyin, freq)
+            oneline = '\t'.join((word, pinyin, freq))
             wordfile.writelines([oneline, os.linesep])
 
     wordfile.close()
```