diff options
author | Jinesh K J <jinsbond007@jinesh.cvit> | 2009-04-06 04:15:42 +0530 |
---|---|---|
committer | Jinesh K J <jinsbond007@jinesh.cvit> | 2009-04-06 04:15:42 +0530 |
commit | 97f2231e942f67450b27f161da11e863334921ba (patch) | |
tree | 347f1882366196a37e9d86442770760d0e348ce5 /silpa/modules/ngram/sample_ngram.py | |
parent | bba7b4bc146bb4623c6cc6ad27d70baf2e02497a (diff) | |
download | Rachana.git-97f2231e942f67450b27f161da11e863334921ba.tar.gz Rachana.git-97f2231e942f67450b27f161da11e863334921ba.tar.xz Rachana.git-97f2231e942f67450b27f161da11e863334921ba.zip |
The ngram code is changed and all hard-coded values are removed
Diffstat (limited to 'silpa/modules/ngram/sample_ngram.py')
-rw-r--r-- | silpa/modules/ngram/sample_ngram.py | 17 |
1 files changed, 4 insertions, 13 deletions
diff --git a/silpa/modules/ngram/sample_ngram.py b/silpa/modules/ngram/sample_ngram.py index 0f46ad6..d373aa8 100644 --- a/silpa/modules/ngram/sample_ngram.py +++ b/silpa/modules/ngram/sample_ngram.py @@ -26,17 +26,7 @@ import codecs import pickle import sys from visualizer import NGramVisualizer -def genCorpus(infile,corpus): - ngv=NGramVisualizer () - try: - corpusfile = open(corpus) - except IOError: - graph_dict = dict() - else: - graph_dict = pickle.load(corpusfile) -# corpusfile.close() - graph_dict=ngv.loadCorpus (infile,graph_dict) - pickle.dump(graph_dict,open(corpus,'w')) + def printGraph(corpus,start_word): ngv=NGramVisualizer () graph_dict=pickle.load(open(corpus)) @@ -51,7 +41,7 @@ if __name__ == "__main__": """ python sample_ngram.py <input file> <corpus path> 1 this will generate the corpus for the given input file, if corpus specified at - corpus path is empty. Else it will recreate the corpus for the with the additional files. + corpus path is empty. Else it will recreate the corpus with the additional data. python sample_ngram.py <corpus path> <start word> 2 this will generate the graph for the given start word in the given corpus at corpus path. @@ -59,6 +49,7 @@ if __name__ == "__main__": This is just a crude attempt, a lot more improvement is to be done. """ if sys.argv[3] == "1": - genCorpus(sys.argv[1],sys.argv[2]) + ngv=NGramVisualizer () + ngv.loadCorpus(sys.argv[1],sys.argv[2]) elif sys.argv[3] == "2": printGraph(sys.argv[1],sys.argv[2]) |