From 3d731193a89fa725eec0bfce92489df0be7a272c Mon Sep 17 00:00:00 2001
From: Peng Wu
Date: Thu, 24 Nov 2011 13:02:10 +0800
Subject: increase train_factor because of larger model data

---
 src/lookup/pinyin_lookup.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

(limited to 'src/lookup/pinyin_lookup.cpp')

diff --git a/src/lookup/pinyin_lookup.cpp b/src/lookup/pinyin_lookup.cpp
index 99e2a20..2a4d191 100644
--- a/src/lookup/pinyin_lookup.cpp
+++ b/src/lookup/pinyin_lookup.cpp
@@ -448,7 +448,7 @@ bool PinyinLookup::train_result(PinyinKeyVector keys, CandidateConstraints const
 //TODO: verify the new training method.
 phrase_token_t last_token = sentence_start;
 // constraints->len + 1 == results->len
- guint32 train_factor = 23;
+ guint32 train_factor = 23 * 5;
 for ( size_t i = 0; i < constraints->len; ++i){
 phrase_token_t * token = &g_array_index(results, phrase_token_t, i);
 if ( *token == null_token )
@@ -465,7 +465,7 @@ bool PinyinLookup::train_result(PinyinKeyVector keys, CandidateConstraints const
 //printf("i:%d\tlast_token:%d\ttoken:%d\n", i, last_token, *token);
 m_phrase_index->get_phrase_item(*token, m_cache_phrase_item);
 m_cache_phrase_item.increase_pinyin_possibility(*m_custom, pinyin_keys + i, train_factor);
- m_phrase_index->add_unigram_frequency(*token, train_factor);
+ m_phrase_index->add_unigram_frequency(*token, train_factor * 10);
 if ( last_token ){
 SingleGram * system, *user;
 m_system_bigram->load(last_token, system);
-- cgit