From f332a01334342bdd4169324bdf889386ff3676fa Mon Sep 17 00:00:00 2001
From: Peng Wu
Date: Thu, 24 Nov 2011 13:02:10 +0800
Subject: increase train_factor because of larger model data

---
 src/lookup/pinyin_lookup.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/lookup/pinyin_lookup.cpp b/src/lookup/pinyin_lookup.cpp
index d6ba68c..7146e51 100644
--- a/src/lookup/pinyin_lookup.cpp
+++ b/src/lookup/pinyin_lookup.cpp
@@ -449,7 +449,7 @@ bool PinyinLookup::train_result(PinyinKeyVector keys, CandidateConstraints const
     //TODO: verify the new training method.
     phrase_token_t last_token = sentence_start;
     // constraints->len + 1 == results->len
-    guint32 train_factor = 23;
+    guint32 train_factor = 23 * 5;
     for ( size_t i = 0; i < constraints->len; ++i){
         phrase_token_t * token = &g_array_index(results, phrase_token_t, i);
         if ( *token == null_token )
@@ -466,7 +466,7 @@ bool PinyinLookup::train_result(PinyinKeyVector keys, CandidateConstraints const
         //std::cout<<"i:"<get_phrase_item(*token, m_cache_phrase_item);
         m_cache_phrase_item.increase_pinyin_possibility(*m_custom, pinyin_keys + i, train_factor);
-        m_phrase_index->add_unigram_frequency(*token, train_factor);
+        m_phrase_index->add_unigram_frequency(*token, train_factor * 10);
         if ( last_token ){
             SingleGram * system, *user;
             m_system_bigram->load(last_token, system);
--
cgit