summaryrefslogtreecommitdiffstats
path: root/lib/myconfig.py
blob: bea11a3d9109280de65d0c225de37707ce65fb49 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
import os


class MyConfig:
    ''' Static configuration for the trainer: epochs, directories,
    size thresholds and file-name conventions.

    Every setting is a class attribute exposed through a small getter
    method; the getters read through ``self`` so that a subclass or an
    instance may override any individual attribute.
    '''

    # Maps each epoch name to its numeric value.
    m_current_epoch = {
        'SegmentEpoch': 1,
        'GenerateEpoch': 2,
        'EstimateEpoch': 3,
        'PruneEpoch': 4,
        'EvaluateEpoch': 5,
    }

    def getEpochs(self):
        ''' Return the epoch-name -> epoch-number dict.

        The shared class-level dict itself is returned (not a copy).
        '''
        return self.m_current_epoch

    # Base directory; the texts/models/finals directories live under it.
    m_trainer_dir = '/media/data/Program/trainer'

    def getBaseDir(self):
        ''' Return the trainer base directory. '''
        return self.m_trainer_dir

    def getTextDir(self):
        ''' Return the 'texts' sub-directory of the base directory. '''
        return os.path.join(self.m_trainer_dir, 'texts')

    def getModelDir(self):
        ''' Return the 'models' sub-directory of the base directory. '''
        return os.path.join(self.m_trainer_dir, 'models')

    def getFinalModelDir(self):
        ''' Return the 'finals' sub-directory of the base directory. '''
        return os.path.join(self.m_trainer_dir, 'finals')

    m_tools_dir = '/media/data/Program/trainer/tools/libpinyin'

    def getToolsDir(self):
        ''' Return the configured tools directory. '''
        return self.m_tools_dir

    m_evals_dir = '/media/data/Program/trainer/evals/libpinyin'

    def getEvalsDir(self):
        ''' Return the configured evals directory. '''
        return self.m_evals_dir

    # About 1,200 Chinese characters.
    m_minimum_chinese_characters = 1200
    # 3.5 units per character (presumably bytes: 3 per UTF-8 encoded
    # character plus some overhead -- TODO confirm).  Floor division keeps
    # the threshold an integer on Python 3, where '/' would yield 4200.0.
    m_minimum_file_size = m_minimum_chinese_characters * 3 + \
        m_minimum_chinese_characters // 2

    def getMinimumFileSize(self):
        ''' Return the minimum file size threshold as an integer. '''
        return self.m_minimum_file_size

    # 11.9 * 1024 * 1024; note that this value is a float.
    m_candidate_model_size = 11.9 * 1024 * 1024

    def getCandidateModelSize(self):
        ''' Return the trained corpus size of model candidates. '''
        return self.m_candidate_model_size

    # Template with a single positional placeholder for the model index.
    m_candidate_model_name = "model-candidates-{0}.db"

    def getCandidateModelName(self, index):
        ''' Return the candidate model file name for the given index.

        index -- value substituted into the '{0}' placeholder of the
                 name template.
        '''
        return self.m_candidate_model_name.format(index)

    m_segment_postfix = '.segmented'

    def getSegmentPostfix(self):
        ''' Return the postfix '.segmented'. '''
        return self.m_segment_postfix

    m_segment_report_postfix = '.segment.report'

    def getSegmentReportPostfix(self):
        ''' Return the postfix '.segment.report'. '''
        return self.m_segment_report_postfix

    # Used for index pages, item pages and the binary model file alike.
    m_status_postfix = '.status'

    def getStatusPostfix(self):
        ''' Return the postfix '.status'. '''
        return self.m_status_postfix

    m_index_postfix = '.index'

    def getIndexPostfix(self):
        ''' Return the postfix '.index'. '''
        return self.m_index_postfix

    m_text_postfix = '.text'

    def getTextPostfix(self):
        ''' Return the postfix '.text'. '''
        return self.m_text_postfix

    m_final_model_file_name = 'interpolation.text'

    def getFinalModelFileName(self):
        ''' Return the file name of the final model. '''
        return self.m_final_model_file_name