summaryrefslogtreecommitdiffstats
path: root/silpa
diff options
context:
space:
mode:
authorSanthosh Thottingal <santhosh.thottingal@gmail.com>2009-03-24 22:56:09 +0530
committerSanthosh Thottingal <santhosh.thottingal@gmail.com>2009-03-24 22:56:09 +0530
commit8de2fcccd538d72730a4b34cf75f1b44294f8435 (patch)
tree456e47c5eff47dcb5199f5141eebca4c4ed90a97 /silpa
parent77998dd48512bf309060911eaaf94758a5886b95 (diff)
downloadRachana.git-8de2fcccd538d72730a4b34cf75f1b44294f8435.tar.gz
Rachana.git-8de2fcccd538d72730a4b34cf75f1b44294f8435.tar.xz
Rachana.git-8de2fcccd538d72730a4b34cf75f1b44294f8435.zip
Hyphenator Module for Silpa
Diffstat (limited to 'silpa')
-rw-r--r--silpa/modules/__init__.py1
-rw-r--r--silpa/modules/hyphenator/__init__.py2
-rw-r--r--silpa/modules/hyphenator/rules/hyph_bn_IN.dic82
-rw-r--r--silpa/modules/hyphenator/rules/hyph_gu_IN.dic86
-rw-r--r--silpa/modules/hyphenator/rules/hyph_hi_IN.dic92
-rw-r--r--silpa/modules/hyphenator/rules/hyph_kn_IN.dic91
-rw-r--r--silpa/modules/hyphenator/rules/hyph_ml_IN.dic93
-rw-r--r--silpa/modules/hyphenator/rules/hyph_or_IN.dic85
-rw-r--r--silpa/modules/hyphenator/rules/hyph_pa_IN.dic83
-rw-r--r--silpa/modules/hyphenator/rules/hyph_ta_IN.dic77
-rw-r--r--silpa/modules/hyphenator/rules/hyph_te_IN.dic91
11 files changed, 783 insertions, 0 deletions
diff --git a/silpa/modules/__init__.py b/silpa/modules/__init__.py
index a436dc9..4ebcec0 100644
--- a/silpa/modules/__init__.py
+++ b/silpa/modules/__init__.py
@@ -1,3 +1,4 @@
#! /usr/bin/env python
# -*- coding: utf-8 -*-
from lemmatizer import *
+from hyphenator import *
diff --git a/silpa/modules/hyphenator/__init__.py b/silpa/modules/hyphenator/__init__.py
new file mode 100644
index 0000000..e1f7e6e
--- /dev/null
+++ b/silpa/modules/hyphenator/__init__.py
@@ -0,0 +1,2 @@
+#! /usr/bin/env python
+# -*- coding: utf-8 -*-
diff --git a/silpa/modules/hyphenator/rules/hyph_bn_IN.dic b/silpa/modules/hyphenator/rules/hyph_bn_IN.dic
new file mode 100644
index 0000000..52acee5
--- /dev/null
+++ b/silpa/modules/hyphenator/rules/hyph_bn_IN.dic
@@ -0,0 +1,82 @@
+UTF-8
+% Hyphenation for Bengali
+% Copyright (C) 2008 Santhosh Thottingal <santhosh.thottingal@gmail.com>
+%
+% This library is free software; you can redistribute it and/or
+% modify it under the terms of the GNU General Public
+% License as published by the Free Software Foundation;
+% either version 3 of the License, or (at your option) any later version.
+%
+% This library is distributed in the hope that it will be useful,
+% but WITHOUT ANY WARRANTY; without even the implied warranty of
+% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+% General Public License for more details.
+%
+% You should have received a copy of the GNU General Public
+% License along with this library; if not, write to the Free Software
+% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+%
+
+অ1
+আ1
+ই1
+ঈ1
+উ1
+ঊ1
+ঋ1
+এ1
+ঐ1
+ঔ1
+া1
+ি1
+ী1
+ু1
+ে1
+ো1
+ৈ1
+ৌ1
+ৗ1
+্2
+ঃ1
+ং1
+1ন
+ন্2
+2ন্‍
+1র
+র্2
+2র্‍
+1ল
+ল্2
+2ল্‍
+্2
+1ণ
+ণ্2
+2ণ্‍
+1ক
+1গ
+1খ
+1ঘ
+1ঙ
+1চ
+1ছ
+1জ
+1ঝ
+1ঞ
+1ট
+1ঠ
+1ড
+1ঢ
+1ত
+1থ
+1দ
+1ধ
+1প
+1ফ
+1ব
+1ভ
+1ম
+1য
+1শ
+1ষ
+1স
+1হ
diff --git a/silpa/modules/hyphenator/rules/hyph_gu_IN.dic b/silpa/modules/hyphenator/rules/hyph_gu_IN.dic
new file mode 100644
index 0000000..13b9b60
--- /dev/null
+++ b/silpa/modules/hyphenator/rules/hyph_gu_IN.dic
@@ -0,0 +1,86 @@
+UTF-8
+% Hyphenation for Gujarati
+% Copyright (C) 2008 Santhosh Thottingal <santhosh.thottingal@gmail.com>
+%
+% This library is free software; you can redistribute it and/or
+% modify it under the terms of the GNU General Public
+% License as published by the Free Software Foundation;
+% either version 3 of the License, or (at your option) any later version.
+%
+% This library is distributed in the hope that it will be useful,
+% but WITHOUT ANY WARRANTY; without even the implied warranty of
+% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+% General Public License for more details.
+%
+% You should have received a copy of the GNU General Public
+% License along with this library; if not, write to the Free Software
+% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+%
+
+અ1
+આ1
+ઇ1
+ઈ1
+ઉ1
+ઊ1
+ઋ1
+એ1
+ઐ1
+ઔ1
+ા1
+િ1
+ી1
+ુ1
+ૂ1
+ૃ1
+ે1
+ો1
+ૈ1
+ૌ1
+્2
+ઃ1
+ં1
+1ન
+ન્2
+2ન્‍
+1ર
+ર્2
+2ર્‍
+1લ
+લ્2
+2લ્‍
+1ળ
+ળ્2
+2ળ્‍
+1ણ
+ણ્2
+2ણ્‍
+1ક
+1ગ
+1ખ
+1ઘ
+1ઙ
+1ચ
+1છ
+1જ
+1ઝ
+1ઞ
+1ટ
+1ઠ
+1ડ
+1ઢ
+1ત
+1થ
+1દ
+1ધ
+1પ
+1ફ
+1બ
+1ભ
+1મ
+1ય
+1વ
+1શ
+1ષ
+1સ
+1હ
diff --git a/silpa/modules/hyphenator/rules/hyph_hi_IN.dic b/silpa/modules/hyphenator/rules/hyph_hi_IN.dic
new file mode 100644
index 0000000..dc82fbd
--- /dev/null
+++ b/silpa/modules/hyphenator/rules/hyph_hi_IN.dic
@@ -0,0 +1,92 @@
+UTF-8
+% Hyphenation for Hindi
+% Copyright (C) 2008 Santhosh Thottingal <santhosh.thottingal@gmail.com>
+%
+% This library is free software; you can redistribute it and/or
+% modify it under the terms of the GNU General Public
+% License as published by the Free Software Foundation;
+% either version 3 of the License, or (at your option) any later version.
+%
+% This library is distributed in the hope that it will be useful,
+% but WITHOUT ANY WARRANTY; without even the implied warranty of
+% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+% General Public License for more details.
+%
+% You should have received a copy of the GNU General Public
+% License along with this library; if not, write to the Free Software
+% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+%
+
+अ1
+आ1
+इ1
+ई1
+उ1
+ऊ1
+ऋ1
+ऎ1
+ए1
+ऐ1
+ऒ1
+औ1
+ा1
+ि1
+ी1
+ु1
+ू1
+ृ1
+ॆ1
+े1
+ॊ1
+ो1
+ै1
+ौ1
+्2
+ः1
+ं1
+1न
+न्2
+2न्‍
+1र
+र्2
+2र्‍
+1ल
+ल्2
+2ल्‍
+1ळ
+ळ्2
+2ळ्‍
+1ण
+ण्2
+2ण्‍
+1क
+1ग
+1ख
+1घ
+1ङ
+1च
+1छ
+1ज
+1झ
+1ञ
+1ट
+1ठ
+1ड
+1ढ
+1त
+1थ
+1द
+1ध
+1प
+1फ
+1ब
+1भ
+1म
+1य
+1व
+1श
+1ष
+1स
+1ह
+1ऴ
+1ऱ
diff --git a/silpa/modules/hyphenator/rules/hyph_kn_IN.dic b/silpa/modules/hyphenator/rules/hyph_kn_IN.dic
new file mode 100644
index 0000000..e241192
--- /dev/null
+++ b/silpa/modules/hyphenator/rules/hyph_kn_IN.dic
@@ -0,0 +1,91 @@
+UTF-8
+% Hyphenation for Kannada
+% Copyright (C) 2008 Santhosh Thottingal <santhosh.thottingal@gmail.com>
+%
+% This library is free software; you can redistribute it and/or
+% modify it under the terms of the GNU General Public
+% License as published by the Free Software Foundation;
+% either version 3 of the License, or (at your option) any later version.
+%
+% This library is distributed in the hope that it will be useful,
+% but WITHOUT ANY WARRANTY; without even the implied warranty of
+% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+% General Public License for more details.
+%
+% You should have received a copy of the GNU General Public
+% License along with this library; if not, write to the Free Software
+% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+%
+
+ಅ1
+ಆ1
+ಇ1
+ಈ1
+ಉ1
+ಊ1
+ಋ1
+ಎ1
+ಏ1
+ಐ1
+ಒ1
+ಔ1
+ಾ1
+ಿ1
+ೀ1
+ು1
+ೂ1
+ೃ1
+ೆ1
+ೇ1
+ೊ1
+ೋ1
+ೈ1
+ೌ1
+್2
+ಃ1
+ಂ1
+1ನ
+ನ್2
+2ನ್‍
+1ರ
+ರ್2
+2ರ್‍
+1ಲ
+ಲ್2
+2ಲ್‍
+1ಳ
+ಳ್2
+2ಳ್‍
+1ಣ
+ಣ್2
+2ಣ್‍
+1ಕ
+1ಗ
+1ಖ
+1ಘ
+1ಙ
+1ಚ
+1ಛ
+1ಜ
+1ಝ
+1ಞ
+1ಟ
+1ಠ
+1ಡ
+1ಢ
+1ತ
+1ಥ
+1ದ
+1ಧ
+1ಪ
+1ಫ
+1ಬ
+1ಭ
+1ಮ
+1ಯ
+1ವ
+1ಶ
+1ಷ
+1ಸ
+1ಹ
+1ಱ
diff --git a/silpa/modules/hyphenator/rules/hyph_ml_IN.dic b/silpa/modules/hyphenator/rules/hyph_ml_IN.dic
new file mode 100644
index 0000000..44b50b9
--- /dev/null
+++ b/silpa/modules/hyphenator/rules/hyph_ml_IN.dic
@@ -0,0 +1,93 @@
+UTF-8
+% Hyphenation for Malayalam
+% Copyright (C) 2008 Santhosh Thottingal <santhosh.thottingal@gmail.com>
+%
+% This library is free software; you can redistribute it and/or
+% modify it under the terms of the GNU General Public
+% License as published by the Free Software Foundation;
+% either version 3 of the License, or (at your option) any later version.
+%
+% This library is distributed in the hope that it will be useful,
+% but WITHOUT ANY WARRANTY; without even the implied warranty of
+% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+% General Public License for more details.
+%
+% You should have received a copy of the GNU General Public
+% License along with this library; if not, write to the Free Software
+% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+%
+
+അ1
+ആ1
+ഇ1
+ഈ1
+ഉ1
+ഊ1
+ഋ1
+എ1
+ഏ1
+ഐ1
+ഒ1
+ഔ1
+ാ1
+ി1
+ീ1
+ു1
+ൂ1
+ൃ1
+െ1
+േ1
+ൊ1
+ോ1
+ൈ1
+ൌ1
+ൗ1
+്2
+ഃ1
+2ം1
+1ന
+ന്2
+2ന്‍
+1ര
+ര്2
+2ര്‍
+1ല
+ല്2
+2ല്‍
+1ള
+ള്2
+2ള്‍
+1ണ
+ണ്2
+2ണ്‍
+1ക
+1ഗ
+1ഖ
+1ഘ
+1ങ
+1ച
+1ഛ
+1ജ
+1ഝ
+1ഞ
+1ട
+1ഠ
+1ഡ
+1ഢ
+1ത
+1ഥ
+1ദ
+1ധ
+1പ
+1ഫ
+1ബ
+1ഭ
+1മ
+1യ
+1വ
+1ശ
+1ഷ
+1സ
+1ഹ
+1ഴ
+1റ
diff --git a/silpa/modules/hyphenator/rules/hyph_or_IN.dic b/silpa/modules/hyphenator/rules/hyph_or_IN.dic
new file mode 100644
index 0000000..c9ea024
--- /dev/null
+++ b/silpa/modules/hyphenator/rules/hyph_or_IN.dic
@@ -0,0 +1,85 @@
+UTF-8
+% Hyphenation for Oriya
+% Copyright (C) 2008 Santhosh Thottingal <santhosh.thottingal@gmail.com>
+%
+% This library is free software; you can redistribute it and/or
+% modify it under the terms of the GNU General Public
+% License as published by the Free Software Foundation;
+% version 3 or later version of the License.
+%
+% This library is distributed in the hope that it will be useful,
+% but WITHOUT ANY WARRANTY; without even the implied warranty of
+% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+% Lesser General Public License for more details.
+%
+% You should have received a copy of the GNU General Public
+% License along with this library; if not, write to the Free Software
+% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+%
+
+ଅ1
+ଆ1
+ଇ1
+ଈ1
+ଉ1
+ଊ1
+ଋ1
+ଏ1
+ଐ1
+ଔ1
+ା1
+ି1
+ୀ1
+ୁ1
+େ1
+ୋ1
+ୈ1
+ୌ1
+ୗ1
+୍2
+ଃ1
+ଂ1
+1ନ
+ନ୍2
+2ନ୍‍
+1ର
+ର୍2
+2ର୍‍
+1ଲ
+ଲ୍2
+2ଲ୍‍
+1ଳ
+ଳ୍2
+2ଳ୍‍
+1ଣ
+ଣ୍2
+2ଣ୍‍
+1କ
+1ଗ
+1ଖ
+1ଘ
+1ଙ
+1ଚ
+1ଛ
+1ଜ
+1ଝ
+1ଞ
+1ଟ
+1ଠ
+1ଡ
+1ଢ
+1ତ
+1ଥ
+1ଦ
+1ଧ
+1ପ
+1ଫ
+1ବ
+1ଭ
+1ମ
+1ଯ
+1ଵ
+1ଶ
+1ଷ
+1ସ
+1ହ
diff --git a/silpa/modules/hyphenator/rules/hyph_pa_IN.dic b/silpa/modules/hyphenator/rules/hyph_pa_IN.dic
new file mode 100644
index 0000000..fcda980
--- /dev/null
+++ b/silpa/modules/hyphenator/rules/hyph_pa_IN.dic
@@ -0,0 +1,83 @@
+UTF-8
+% Hyphenation for Panjabi (Gurmukhi)
+% Copyright (C) 2008 Santhosh Thottingal <santhosh.thottingal@gmail.com>
+%
+% This library is free software; you can redistribute it and/or
+% modify it under the terms of the GNU General Public
+% License as published by the Free Software Foundation;
+% either version 3 of the License, or (at your option) any later version.
+%
+% This library is distributed in the hope that it will be useful,
+% but WITHOUT ANY WARRANTY; without even the implied warranty of
+% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+% General Public License for more details.
+%
+% You should have received a copy of the GNU General Public
+% License along with this library; if not, write to the Free Software
+% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+%
+
+ਅ1
+ਆ1
+ਇ1
+ਈ1
+ਉ1
+ਊ1
+ਏ1
+ਐ1
+ਔ1
+ਾ1
+ਿ1
+ੀ1
+ੁ1
+ੂ1
+ੇ1
+ੋ1
+ੈ1
+ੌ1
+੍2
+ਃ1
+ਂ1
+1ਨ
+ਨ੍2
+2ਨ੍‍
+1ਰ
+ਰ੍2
+2ਰ੍‍
+1ਲ
+ਲ੍2
+2ਲ੍‍
+1ਲ਼
+ਲ਼੍2
+2ਲ਼੍‍
+1ਣ
+ਣ੍2
+2ਣ੍‍
+1ਕ
+1ਗ
+1ਖ
+1ਘ
+1ਙ
+1ਚ
+1ਛ
+1ਜ
+1ਝ
+1ਞ
+1ਟ
+1ਠ
+1ਡ
+1ਢ
+1ਤ
+1ਥ
+1ਦ
+1ਧ
+1ਪ
+1ਫ
+1ਬ
+1ਭ
+1ਮ
+1ਯ
+1ਵ
+1ਸ਼
+1ਸ
+1ਹ
diff --git a/silpa/modules/hyphenator/rules/hyph_ta_IN.dic b/silpa/modules/hyphenator/rules/hyph_ta_IN.dic
new file mode 100644
index 0000000..298d7d1
--- /dev/null
+++ b/silpa/modules/hyphenator/rules/hyph_ta_IN.dic
@@ -0,0 +1,77 @@
+UTF-8
+% Hyphenation for Tamil
+% Copyright (C) 2008 Santhosh Thottingal <santhosh.thottingal@gmail.com>
+%
+% This library is free software; you can redistribute it and/or
+% modify it under the terms of the GNU General Public
+% License as published by the Free Software Foundation;
+% either version 3 of the License, or (at your option) any later version.
+%
+% This library is distributed in the hope that it will be useful,
+% but WITHOUT ANY WARRANTY; without even the implied warranty of
+% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+% General Public License for more details.
+%
+% You should have received a copy of the GNU General Public
+% License along with this library; if not, write to the Free Software
+% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+%
+
+அ1
+ஆ1
+இ1
+ஈ1
+உ1
+ஊ1
+எ1
+ஏ1
+ஐ1
+ஒ1
+ஔ1
+ா1
+ி1
+ீ1
+ு1
+ூ1
+ெ1
+ே1
+ொ1
+ோ1
+ை1
+ௌ1
+ௗ1
+்2
+ஃ1
+ஂ1
+1ந
+ந்2
+2ந்‍
+1ர
+ர்2
+2ர்‍
+1ல
+ல்2
+2ல்‍
+1ள
+ள்2
+2ள்‍
+1ண
+ண்2
+2ண்‍
+1க
+1ங
+1ச
+1ஜ
+1ஞ
+1ட
+1த
+1ப
+1ம
+1ய
+1வ
+1ஶ
+1ஷ
+1ஸ
+1ஹ
+1ழ
+1ற
diff --git a/silpa/modules/hyphenator/rules/hyph_te_IN.dic b/silpa/modules/hyphenator/rules/hyph_te_IN.dic
new file mode 100644
index 0000000..62ddfe2
--- /dev/null
+++ b/silpa/modules/hyphenator/rules/hyph_te_IN.dic
@@ -0,0 +1,91 @@
+UTF-8
+% Hyphenation for Telugu
+% Copyright (C) 2008 Santhosh Thottingal <santhosh.thottingal@gmail.com>
+%
+% This library is free software; you can redistribute it and/or
+% modify it under the terms of the GNU General Public
+% License as published by the Free Software Foundation;
+% either version 3 of the License, or (at your option) any later version.
+%
+% This library is distributed in the hope that it will be useful,
+% but WITHOUT ANY WARRANTY; without even the implied warranty of
+% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+% General Public License for more details.
+%
+% You should have received a copy of the GNU General Public
+% License along with this library; if not, write to the Free Software
+% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+%
+
+అ1
+ఆ1
+ఇ1
+ఈ1
+ఉ1
+ఊ1
+ఋ1
+ఎ1
+ఏ1
+ఐ1
+ఒ1
+ఔ1
+ా1
+ి1
+ీ1
+ు1
+ూ1
+ృ1
+ె1
+ే1
+ొ1
+ో1
+ై1
+ౌ1
+్2
+ః1
+ం1
+1న
+న్2
+2న్‍
+1ర
+ర్2
+2ర్‍
+1ల
+ల్2
+2ల్‍
+1ళ
+ళ్2
+2ళ్‍
+1ణ
+ణ్2
+2ణ్‍
+1క
+1గ
+1ఖ
+1ఘ
+1ఙ
+1చ
+1ఛ
+1జ
+1ఝ
+1ఞ
+1ట
+1ఠ
+1డ
+1ఢ
+1త
+1థ
+1ద
+1ధ
+1ప
+1ఫ
+1బ
+1భ
+1మ
+1య
+1వ
+1శ
+1ష
+1స
+1హ
+1ఱ