summary | refs | log | tree | commit | diff | stats
path: root/utils
diff options
context:
space:
mode:
author Peng Wu <alexepico@gmail.com> 2011-06-09 18:04:45 +0800
committer Peng Wu <alexepico@gmail.com> 2011-06-09 18:04:45 +0800
commit c7aeb1c57cea4f458b3084a34397e44110297ac8 (patch)
tree f7106f74ed43e132d2029340b06a8e351c526b80 /utils
parent 982cb961cec5f400a52948a17e3d33ae10bb90b4 (diff)
download libpinyin-c7aeb1c57cea4f458b3084a34397e44110297ac8.tar.gz
libpinyin-c7aeb1c57cea4f458b3084a34397e44110297ac8.tar.xz
libpinyin-c7aeb1c57cea4f458b3084a34397e44110297ac8.zip
fixes read document
Diffstat (limited to 'utils')
-rw-r--r-- utils/training/gen_deleted_ngram.cpp 13
-rw-r--r-- utils/training/gen_k_mixture_model.cpp 16
-rw-r--r-- utils/training/gen_ngram.cpp 13
3 files changed, 21 insertions, 21 deletions
diff --git a/utils/training/gen_deleted_ngram.cpp b/utils/training/gen_deleted_ngram.cpp
index 93986d6..b39490f 100644
--- a/utils/training/gen_deleted_ngram.cpp
+++ b/utils/training/gen_deleted_ngram.cpp
@@ -78,13 +78,14 @@ int main(int argc, char * argv[]){
glong phrase_len = 0;
utf16_t * phrase = g_utf8_to_utf16(linebuf, -1, NULL, &phrase_len, NULL);
- if ( phrase_len == 0 )
- continue;
-
phrase_token_t token = 0;
- int result = g_phrases->search( phrase_len, phrase, token);
- if ( ! (result & SEARCH_OK) )
- token = 0;
+ if ( 0 != phrase_len ) {
+ int result = g_phrases->search( phrase_len, phrase, token);
+ if ( ! (result & SEARCH_OK) )
+ token = 0;
+ g_free(phrase);
+ phrase = NULL;
+ }
last_token = cur_token;
cur_token = token;
diff --git a/utils/training/gen_k_mixture_model.cpp b/utils/training/gen_k_mixture_model.cpp
index 13ff04d..bd350b4 100644
--- a/utils/training/gen_k_mixture_model.cpp
+++ b/utils/training/gen_k_mixture_model.cpp
@@ -60,16 +60,14 @@ bool read_document(PhraseLargeTable * phrases, FILE * document,
glong phrase_len = 0;
utf16_t * phrase = g_utf8_to_utf16(linebuf, -1, NULL, &phrase_len, NULL);
- if ( phrase_len == 0 )
- continue;
-
phrase_token_t token = 0;
- int search_result = phrases->search( phrase_len, phrase, token );
- if ( ! (search_result & SEARCH_OK) )
- token = 0;
-
- g_free(phrase);
- phrase = NULL;
+ if ( 0 != phrase_len ) {
+ int search_result = phrases->search( phrase_len, phrase, token );
+ if ( ! (search_result & SEARCH_OK) )
+ token = 0;
+ g_free(phrase);
+ phrase = NULL;
+ }
last_token = cur_token;
cur_token = token;
diff --git a/utils/training/gen_ngram.cpp b/utils/training/gen_ngram.cpp
index 9e79f1d..2b0e1dd 100644
--- a/utils/training/gen_ngram.cpp
+++ b/utils/training/gen_ngram.cpp
@@ -91,13 +91,14 @@ int main(int argc, char * argv[]){
glong phrase_len = 0;
utf16_t * phrase = g_utf8_to_utf16(linebuf, -1, NULL, &phrase_len, NULL);
- if ( phrase_len == 0 )
- continue;
-
phrase_token_t token = 0;
- int result = g_phrases->search( phrase_len, phrase, token);
- if ( ! (result & SEARCH_OK) )
- token = 0;
+ if ( 0 != phrase_len ) {
+ int result = g_phrases->search( phrase_len, phrase, token);
+ if ( ! (result & SEARCH_OK) )
+ token = 0;
+ g_free(phrase);
+ phrase = NULL;
+ }
last_token = cur_token;
cur_token = token;