# Provenance: commit 8b17bffcfee66a5db74243d380ba82c19f397b9b
# Author: Peng Wu, Fri, 18 Jan 2013 16:53:44 +0800
# Subject: write getPartialWordList func
# Target: partialword.py (20 lines appended after dropNgramTableClone)


# from 2-gram.db
def getPartialWordList(conn, threshold):
    """Collect the partial words returned by SELECT_PARTIAL_WORD_DML.

    The query is executed with ``threshold`` as its only bound parameter.
    Each returned row is expected to be a ``(words_str, freq)`` pair where
    ``words_str`` holds two parts joined by the separator reported by
    ``config.getWordSep()``.

    Args:
        conn: database connection providing ``cursor()`` and ``commit()``;
            the original comment indicates it is the 2-gram database.
        threshold: value bound to the query's single placeholder; it is
            also printed to stdout before the query runs.

    Returns:
        A list of ``(merged_word, prefix, postfix, freq)`` tuples, where
        ``merged_word`` is ``prefix + postfix``.

    Raises:
        ValueError: if a row is not a 2-item sequence, or if its word
            string does not split into exactly two parts on the separator.
    """
    print(threshold)

    separator = config.getWordSep()

    cursor = conn.cursor()
    records = cursor.execute(SELECT_PARTIAL_WORD_DML, (threshold, )).fetchall()

    def to_entry(record):
        # Trim separator characters from both ends, then split only on the
        # first remaining separator so the tail keeps any later ones.
        phrase, freq = record
        head, tail = phrase.strip(separator).split(separator, 1)
        return (head + tail, head, tail, freq)

    entries = [to_entry(record) for record in records]

    conn.commit()
    return entries