From 314568bc3dee76b2fc4a0f7f1ea7d06b4ca48bde Mon Sep 17 00:00:00 2001 From: Peng Wu Date: Thu, 8 Aug 2013 13:18:10 +0800 Subject: update scripts --- scripts/correct.py | 95 -------------------------------------------------- scripts/pinyintable.py | 25 ------------- 2 files changed, 120 deletions(-) delete mode 100644 scripts/correct.py (limited to 'scripts') diff --git a/scripts/correct.py b/scripts/correct.py deleted file mode 100644 index ffd5998..0000000 --- a/scripts/correct.py +++ /dev/null @@ -1,95 +0,0 @@ -# -*- coding: utf-8 -*- -# vim:set et sts=4 sw=4: -# -# libpinyin - Library to deal with pinyin. -# -# Copyright (c) 2007-2008 Peng Huang -# Copyright (C) 2011 Peng Wu -# -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation; either version 2, or (at your option) -# any later version. -# -# This program is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with this program; if not, write to the Free Software -# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. - -auto_correct = [ - # "correct", "wrong" - ("ng", "gn"), - ("ng", "mg"), - ("iu", "iou"), - ("ui", "uei"), - ("un", "uen"), -# ("ue", "ve"), - ("ve", "ue"), - ("ong", "on"), -] - -auto_correct_ext = [ - # "correct", "wrong", flag - ("ju", "jv", "PINYIN_CORRECT_V_U"), - ("qu", "qv", "PINYIN_CORRECT_V_U"), - ("xu", "xv", "PINYIN_CORRECT_V_U"), - ("yu", "yv", "PINYIN_CORRECT_V_U"), - - ("jue", "jve", "PINYIN_CORRECT_V_U"), - ("que", "qve", "PINYIN_CORRECT_V_U"), - ("xue", "xve", "PINYIN_CORRECT_V_U"), - ("yue", "yve", "PINYIN_CORRECT_V_U"), - - ("juan", "jvan", "PINYIN_CORRECT_V_U"), - ("quan", "qvan", "PINYIN_CORRECT_V_U"), - ("xuan", "xvan", "PINYIN_CORRECT_V_U"), - ("yuan", "yvan", "PINYIN_CORRECT_V_U"), - - ("jun", "jvn", "PINYIN_CORRECT_V_U"), - ("qun", "qvn", "PINYIN_CORRECT_V_U"), - ("xun", "xvn", "PINYIN_CORRECT_V_U"), - ("yun", "yvn", "PINYIN_CORRECT_V_U"), - -# ("juang", "jvang", "PINYIN_CORRECT_V_U"), -# ("quang", "qvang", "PINYIN_CORRECT_V_U"), -# ("xuang", "xvang", "PINYIN_CORRECT_V_U"), -# ("yuang", "yvang", "PINYIN_CORRECT_V_U"), - -# ("jun", "jven", "PINYIN_CORRECT_UEN_UN | PINYIN_CORRECT_V_U"), -# ("qun", "qven", "PINYIN_CORRECT_UEN_UN | PINYIN_CORRECT_V_U"), -# ("xun", "xven", "PINYIN_CORRECT_UEN_UN | PINYIN_CORRECT_V_U"), -# ("yun", "yven", "PINYIN_CORRECT_UEN_UN | PINYIN_CORRECT_V_U"), -] - - -''' -fuzzy_shengmu = [ - ("c", "ch"), - ("ch", "c"), - ("z", "zh"), - ("zh", "z"), - ("s", "sh"), - ("sh", "s"), - ("l", "n"), - ("n", "l"), - ("f", "h"), - ("h", "f"), - ("l", "r"), - ("r", "l"), - ("k", "g"), - ("g", "k"), -] - -fuzzy_yunmu = [ - ("an", "ang"), - ("ang", "an"), - ("en", "eng"), - ("eng", "en"), - ("in", "ing"), - ("ing", "in"), -] -''' diff --git a/scripts/pinyintable.py b/scripts/pinyintable.py index bddf2dc..cd2a3db 100644 --- a/scripts/pinyintable.py +++ b/scripts/pinyintable.py @@ -23,7 +23,6 @@ import pinyin import bopomofo import chewing import itertools -from correct import * pinyin_list = sorted(bopomofo.PINYIN_BOPOMOFO_MAP.keys()) @@ -87,8 +86,6 @@ def get_chewing(pinyin_key): def gen_pinyin_list(): for p in itertools.chain(gen_pinyins(), gen_shengmu(), - gen_corrects(), - gen_u_to_v(), ): yield p @@ -135,28 +132,6 @@ def gen_shengmu(): flags, chewing_key -def gen_corrects(): - #generate corrections - for correct, wrong in auto_correct: - flags = ['IS_PINYIN', 'PINYIN_CORRECT_{0}_{1}'.format(wrong.upper(), - correct.upper())] - for pinyin_key in pinyin_list: - #fixes partial pinyin instead of the whole pinyin - if pinyin_key.endswith(correct) and pinyin_key != correct: - chewing_key = bopomofo.PINYIN_BOPOMOFO_MAP[pinyin_key] - new_pinyin_key = pinyin_key.replace(correct, wrong) - yield pinyin_key, new_pinyin_key, chewing_key,\ - flags, get_chewing(pinyin_key) - - -def gen_u_to_v(): - #generate U to V - for correct, wrong, flags in auto_correct_ext: - #over-ride flags - flags = ['IS_PINYIN', 'PINYIN_CORRECT_V_U'] - pinyin_key = correct - chewing_key = bopomofo.PINYIN_BOPOMOFO_MAP[pinyin_key] - yield correct, wrong, chewing_key, flags, get_chewing(pinyin_key) ### main function ### if __name__ == "__main__": -- cgit