blob: 5e9558277d4e737d86ef0eb68346da0ce52f1e57 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
|
import os
class MyConfig:
    ''' Trainer configuration: epoch numbers, directories and file postfixes.

    Every setting is stored as a class attribute (m_*) and exposed through
    a matching get*() accessor, so an instance carries no state of its own.
    '''

    # Epoch number registered under each epoch name.
    m_current_epoch = {
        'SegmentEpoch': 1,
        'GenerateEpoch': 2,
        'EstimateEpoch': 3,
        'PruneEpoch': 4,
        'EvaluateEpoch': 5,
    }

    def getSegmentEpoch(self):
        ''' Return the epoch number stored under 'SegmentEpoch'. '''
        return self.m_current_epoch['SegmentEpoch']

    def getGenerateEpoch(self):
        ''' Return the epoch number stored under 'GenerateEpoch'. '''
        return self.m_current_epoch['GenerateEpoch']

    def getEstimateEpoch(self):
        ''' Return the epoch number stored under 'EstimateEpoch'. '''
        return self.m_current_epoch['EstimateEpoch']

    def getPruneEpoch(self):
        ''' Return the epoch number stored under 'PruneEpoch'. '''
        return self.m_current_epoch['PruneEpoch']

    def getEvaluateEpoch(self):
        ''' Return the epoch number stored under 'EvaluateEpoch'. '''
        return self.m_current_epoch['EvaluateEpoch']

    # Base directory; the other directories are sub-directories of it.
    m_trainer_dir = '/media/data/Program/trainer'

    def getBaseDir(self):
        ''' Return the trainer base directory. '''
        return self.m_trainer_dir

    def getTextDir(self):
        ''' Return the 'texts' sub-directory of the base directory. '''
        return os.path.join(self.m_trainer_dir, 'texts')

    def getModelDir(self):
        ''' Return the 'models' sub-directory of the base directory. '''
        return os.path.join(self.m_trainer_dir, 'models')

    def getFinalModelDir(self):
        ''' Return the 'finals' sub-directory of the base directory. '''
        return os.path.join(self.m_trainer_dir, 'finals')

    #about 1,200 Chinese characters
    m_minimum_chinese_characters = 1200
    # Three and a half units per character (presumably bytes of encoded
    # text -- TODO confirm). Floor division keeps the result an int on
    # Python 3 as well as on Python 2; plain '/' would yield 4200.0.
    m_minimum_file_size = m_minimum_chinese_characters * 3 + \
        m_minimum_chinese_characters // 2

    def getMinimumFileSize(self):
        ''' Return the minimum file size as an integer (4200). '''
        return self.m_minimum_file_size

    m_segment_postfix = '.segmented'

    def getSegmentPostfix(self):
        ''' Return the segment postfix, '.segmented'. '''
        return self.m_segment_postfix

    #For both index page, item page and binary model file
    m_status_postfix = '.status'

    def getStatusPostfix(self):
        ''' Return the status postfix, '.status'. '''
        return self.m_status_postfix

    m_index_postfix = '.index'

    def getIndexPostfix(self):
        ''' Return the index postfix, '.index'. '''
        return self.m_index_postfix

    m_text_postfix = '.text'

    def getTextPostfix(self):
        ''' Return the text postfix, '.text'. '''
        return self.m_text_postfix

    m_final_model_file_name = 'interpolation.text'

    def getFinalModelFileName(self):
        ''' Return the final model file name, 'interpolation.text'. '''
        return self.m_final_model_file_name
|