summary | refs | log | tree | commit | diff | stats
path: root/utils/training/gen_ngram.cpp
diff options
context:
space:
mode:
author Peng Wu <alexepico@gmail.com> 2011-04-19 10:12:12 +0800
committer Peng Wu <alexepico@gmail.com> 2011-04-19 10:12:12 +0800
commit 1bd05a07d29dbe3f8b03ae73b879797aea8c653a (patch)
tree 3cb34b4e8f4b1f9937e172fe5d156cf728d7146d /utils/training/gen_ngram.cpp
parent d74fda51c92a80d195f9e7030dc7cf1ddb47f23d (diff)
download libpinyin-1bd05a07d29dbe3f8b03ae73b879797aea8c653a.tar.gz
libpinyin-1bd05a07d29dbe3f8b03ae73b879797aea8c653a.tar.xz
libpinyin-1bd05a07d29dbe3f8b03ae73b879797aea8c653a.zip
fixes phrase large table
Diffstat (limited to 'utils/training/gen_ngram.cpp')
-rw-r--r-- utils/training/gen_ngram.cpp 3
1 files changed, 3 insertions, 0 deletions
diff --git a/utils/training/gen_ngram.cpp b/utils/training/gen_ngram.cpp
index 3203cd1..918c9c8 100644
--- a/utils/training/gen_ngram.cpp
+++ b/utils/training/gen_ngram.cpp
@@ -100,6 +100,9 @@ int main(int argc, char * argv[]){
glong phrase_len = 0;
utf16_t * phrase = g_utf8_to_utf16(linebuf, -1, NULL, &phrase_len, NULL);
+ if ( phrase_len == 0 )
+ continue;
+
phrase_token_t token = 0;
int result = g_phrases->search( phrase_len, phrase, token);
if ( ! (result & SEARCH_OK) )