summaryrefslogtreecommitdiffstats
path: root/silpa/www/utils/langdetect.py
diff options
context:
space:
mode:
Diffstat (limited to 'silpa/www/utils/langdetect.py')
-rw-r--r--silpa/www/utils/langdetect.py76
1 files changed, 0 insertions, 76 deletions
diff --git a/silpa/www/utils/langdetect.py b/silpa/www/utils/langdetect.py
deleted file mode 100644
index a75ba15..0000000
--- a/silpa/www/utils/langdetect.py
+++ /dev/null
@@ -1,76 +0,0 @@
-# Spellchecker with language detection
-# coding: utf-8
-#
-# Copyright © 2008 Santhosh Thottingal
-# Released under the GPLV3+ license
-
-from common import *
-
-class LangDetect(SilpaModule):
-
- def detect_lang(self, text):
- words=text.split(" ")
- word_count=len(words)
- word_iter=0
- word=""
- result_dict=dict()
- while word_iter < word_count:
- word=words[word_iter]
- if(word):
- length = len(word)
- index = 0
- while index < length:
- letter=word[index]
- if ((letter >= u'ം') & (letter <=u'൯')):
- result_dict[word]= "ml_IN"
- if ((letter >= u'ঁ') & (letter <= u'৺')):
- result_dict[word]= "bn_IN"
- if ((letter >= u'ँ') & (letter <= u'ॿ')):
- result_dict[word]= "hi_IN"
- if ((letter >=u'ઁ') & (letter <= u'૱')):
- result_dict[word]= "gu_IN"
- if ((letter >= u'ਁ') & (letter <=u'ੴ')):
- result_dict[word]= "pa_IN"
- if ((letter >= u'ಂ') & (letter <=u'ೲ')):
- result_dict[word]= "ka_IN"
- if ((letter >= u'ଁ') & (letter <= u'ୱ')):
- result_dict[word]= "or_IN"
- if ((letter >=u'ஂ') & (letter <= u'௺')):
- result_dict[word]= "ta_IN"
- if ((letter >=u'ఁ') & (letter <= u'౯')):
- result_dict[word]= "te_IN"
- if ((letter <= u'z')):
- result_dict[word]= "en_US"
-
- index=index+1
- word_iter=word_iter+1
- return result_dict
- def process(self,form):
- response = """
- <h2>Language Detection</h2></hr>
- <p>Enter the text for detecting the language in the below text area.
- Language of each word will be detected.
- You can give the text in any language and even with mixed language
- </p>
- <form action="" method="post">
- <textarea cols='100' rows='25' name='input_text' id='id1'>%s</textarea>
- <input type="submit" id="Detect Language" value="Detect Language" name="action" style="width:12em;"/>
- <input type="reset" value="Clear" style="width:12em;"/>
- </br>
- </form>
- """
- if(form.has_key('input_text')):
- text = action=form['input_text'].value .decode('utf-8')
- response=response % text
- detected_lang_dict = self.detect_lang(text)
- response = response+"<h2>Language Detection Results</h2></hr>"
- response = response+"<table><th><td>Word</td><td>Language</td></th>"
- for key in detected_lang_dict:
- response = response+"<tr><td>"+key+"</td><td>"+detected_lang_dict[key]+"</td></tr>"
- response = response+"</table> "
- else:
- response=response % ""
- return response
-
-def getInstance():
- return LangDetect()