rename files

author: Peng Wu <alexepico@gmail.com> 2011-11-02 12:08:45 +0800
committer: Peng Wu <alexepico@gmail.com> 2011-11-02 12:08:45 +0800
commit: 2ef0735e5fafa28a51ec04cf8e24e21c7486a040 (patch)
tree: 4f5498cb8ea1cb26c3301151b53e79d7f08765ce /scripts/genspecialtable.py
parent: d894cf14145e54d934d0490aae80bfb8c7aafb79 (diff)
download: libpinyin-2ef0735e5fafa28a51ec04cf8e24e21c7486a040.tar.gz
libpinyin-2ef0735e5fafa28a51ec04cf8e24e21c7486a040.tar.xz
libpinyin-2ef0735e5fafa28a51ec04cf8e24e21c7486a040.zip
1 files changed, 0 insertions, 105 deletions
diff --git a/scripts/genspecialtable.py b/scripts/genspecialtable.py
deleted file mode 100644
index 928ca9e..0000000
--- a/scripts/genspecialtable.py
+++ /dev/null
@@ -1,105 +0,0 @@
-# -*- coding: utf-8 -*-
-# vim:set et sts=4 sw=4:
-#
-# libpinyin - Library to deal with pinyin.
-#
-# Copyright (C) 2011 Peng Wu <alexepico@gmail.com>
-#
-# This program is free software; you can redistribute it and/or modify
-# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation; either version 2, or (at your option)
-# any later version.
-#
-# This program is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-# GNU General Public License for more details.
-#
-# You should have received a copy of the GNU General Public License
-# along with this program; if not, write to the Free Software
-# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
-
-
-import os
-import sys
-import math
-import pinyin
-
-pinyin_list = sorted(pinyin.PINYIN_LIST)
-shengmu_list = sorted(pinyin.SHENGMU_LIST)
-yunmu_list = sorted(pinyin.YUNMU_LIST)
-
-phrase_dict = {}
-
-
-def load_phrase(filename):
-    phrasefile = open(filename, "r")
-    for line in phrasefile.readlines():
-        line = line.rstrip(os.linesep)
-        (pinyin_str, freq) = line.split(' ', 1)
-        freq = int(math.floor(float(freq)))
-        if 0 == freq:
-            #print(pinyin_str)
-            continue
-
-        (first_key, second_key) = pinyin_str.split("'")
-        if first_key[-1].isdigit():
-            first_key = first_key[:-1]
-        if second_key[-1].isdigit():
-            second_key = second_key[:-1]
-        phrase_dict[(first_key, second_key)] = freq
-    phrasefile.close()
-
-
-def gen_all_divided():
-    for pinyin_key in pinyin_list:
-        for first_key in pinyin_list:
-            if len(pinyin_key) <= len(first_key):
-                continue
-            if not pinyin_key.startswith(first_key):
-                continue
-            second_key = pinyin_key[len(first_key):]
-            if second_key in pinyin_list:
-                yield pinyin_key, first_key, second_key
-
-
-def filter_divided():
-    for (pinyin_key, first_key, second_key) in gen_all_divided():
-        if not (first_key, second_key) in phrase_dict:
-            continue
-        freq = phrase_dict[(first_key, second_key)]
-        yield pinyin_key, first_key, second_key, freq
-
-
-def gen_all_resplit():
-    for pinyin_key in pinyin_list:
-        if pinyin_key[-1] in ["n", "g", "r"]:
-            for yun in yunmu_list:
-                if yun not in pinyin_list:
-                    continue
-                new_pinyin_key = pinyin_key[-1] + yun
-                # if new_pinyin in pinyin_list:
-                yield pinyin_key, yun, pinyin_key[:-1], new_pinyin_key
-        elif pinyin_key[-1] in ["e"]:
-            yield pinyin_key, "r", pinyin_key[:-1], "er"
-
-
-def filter_resplit():
-    for (orig_first_key, orig_second_key, new_first_key, new_second_key) \
-    in gen_all_resplit():
-        if not (new_first_key, new_second_key) in phrase_dict:
-            continue
-        orig_freq = 0
-        new_freq = phrase_dict[(new_first_key, new_second_key)]
-        if (orig_first_key, orig_second_key) in phrase_dict:
-            orig_freq = phrase_dict[(orig_first_key, orig_second_key)]
-        yield orig_first_key, orig_second_key, orig_freq, \
-        new_first_key, new_second_key, new_freq
-
-
-if __name__ == "__main__":
-    load_phrase("pinyin2.txt")
-    for p in filter_divided():
-        print (p)
-    for p in filter_resplit():
-        print (p)
author	Peng Wu <alexepico@gmail.com>	2011-11-02 12:08:45 +0800
committer	Peng Wu <alexepico@gmail.com>	2011-11-02 12:08:45 +0800
commit	2ef0735e5fafa28a51ec04cf8e24e21c7486a040 (patch)
tree	4f5498cb8ea1cb26c3301151b53e79d7f08765ce /scripts/genspecialtable.py
parent	d894cf14145e54d934d0490aae80bfb8c7aafb79 (diff)
download	libpinyin-2ef0735e5fafa28a51ec04cf8e24e21c7486a040.tar.gz libpinyin-2ef0735e5fafa28a51ec04cf8e24e21c7486a040.tar.xz libpinyin-2ef0735e5fafa28a51ec04cf8e24e21c7486a040.zip