From 8de2fcccd538d72730a4b34cf75f1b44294f8435 Mon Sep 17 00:00:00 2001 From: Santhosh Thottingal Date: Tue, 24 Mar 2009 22:56:09 +0530 Subject: Hyphenator Module for Silpa --- silpa/modules/__init__.py | 1 + silpa/modules/hyphenator/__init__.py | 2 + silpa/modules/hyphenator/rules/hyph_bn_IN.dic | 82 +++++++++++++++++++++++ silpa/modules/hyphenator/rules/hyph_gu_IN.dic | 86 +++++++++++++++++++++++++ silpa/modules/hyphenator/rules/hyph_hi_IN.dic | 92 ++++++++++++++++++++++++++ silpa/modules/hyphenator/rules/hyph_kn_IN.dic | 91 ++++++++++++++++++++++++++ silpa/modules/hyphenator/rules/hyph_ml_IN.dic | 93 +++++++++++++++++++++++++++ silpa/modules/hyphenator/rules/hyph_or_IN.dic | 85 ++++++++++++++++++++++++ silpa/modules/hyphenator/rules/hyph_pa_IN.dic | 83 ++++++++++++++++++++++++ silpa/modules/hyphenator/rules/hyph_ta_IN.dic | 77 ++++++++++++++++++++++ silpa/modules/hyphenator/rules/hyph_te_IN.dic | 91 ++++++++++++++++++++++++++ 11 files changed, 783 insertions(+) create mode 100644 silpa/modules/hyphenator/__init__.py create mode 100644 silpa/modules/hyphenator/rules/hyph_bn_IN.dic create mode 100644 silpa/modules/hyphenator/rules/hyph_gu_IN.dic create mode 100644 silpa/modules/hyphenator/rules/hyph_hi_IN.dic create mode 100644 silpa/modules/hyphenator/rules/hyph_kn_IN.dic create mode 100644 silpa/modules/hyphenator/rules/hyph_ml_IN.dic create mode 100644 silpa/modules/hyphenator/rules/hyph_or_IN.dic create mode 100644 silpa/modules/hyphenator/rules/hyph_pa_IN.dic create mode 100644 silpa/modules/hyphenator/rules/hyph_ta_IN.dic create mode 100644 silpa/modules/hyphenator/rules/hyph_te_IN.dic (limited to 'silpa') diff --git a/silpa/modules/__init__.py b/silpa/modules/__init__.py index a436dc9..4ebcec0 100644 --- a/silpa/modules/__init__.py +++ b/silpa/modules/__init__.py @@ -1,3 +1,4 @@ #! /usr/bin/env python # -*- coding: utf-8 -*- from lemmatizer import * +from hyphenator import * diff --git a/silpa/modules/hyphenator/__init__.py b/silpa/modules/hyphenator/__init__.py new file mode 100644 index 0000000..e1f7e6e --- /dev/null +++ b/silpa/modules/hyphenator/__init__.py @@ -0,0 +1,2 @@ +#! /usr/bin/env python +# -*- coding: utf-8 -*- diff --git a/silpa/modules/hyphenator/rules/hyph_bn_IN.dic b/silpa/modules/hyphenator/rules/hyph_bn_IN.dic new file mode 100644 index 0000000..52acee5 --- /dev/null +++ b/silpa/modules/hyphenator/rules/hyph_bn_IN.dic @@ -0,0 +1,82 @@ +UTF-8 +% Hyphenation for Bengali +% Copyright (C) 2008 Santhosh Thottingal +% +% This library is free software; you can redistribute it and/or +% modify it under the terms of the GNU General Public +% License as published by the Free Software Foundation; +% version 3 or later version of the License. +% +% This library is distributed in the hope that it will be useful, +% but WITHOUT ANY WARRANTY; without even the implied warranty of +% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +% Lesser General Public License for more details. +% +% You should have received a copy of the GNU General Public +% License along with this library; if not, write to the Free Software +% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +% + +অ1 +আ1 +ই1 +ঈ1 +উ1 +ঊ1 +ঋ1 +এ1 +ঐ1 +ঔ1 +া1 +ি1 +ী1 +ু1 +ে1 +ো1 +ৈ1 +ৌ1 +ৗ1 +্2 +ঃ1 +ং1 +1ন +ন্2 +2ন্‍ +1র +র্2 +2র্‍ +1ল +ল্2 +2ল্‍ +্2 +1ণ +ণ্2 +2ণ্‍ +1ক +1গ +1খ +1ঘ +1ঙ +1চ +1ছ +1জ +1ঝ +1ঞ +1ট +1ঠ +1ড +1ঢ +1ত +1থ +1দ +1ধ +1প +1ফ +1ব +1ভ +1ম +1য +1শ +1ষ +1স +1হ diff --git a/silpa/modules/hyphenator/rules/hyph_gu_IN.dic b/silpa/modules/hyphenator/rules/hyph_gu_IN.dic new file mode 100644 index 0000000..13b9b60 --- /dev/null +++ b/silpa/modules/hyphenator/rules/hyph_gu_IN.dic @@ -0,0 +1,86 @@ +UTF-8 +% Hyphenation for Gujarati +% Copyright (C) 2008 Santhosh Thottingal +% +% This library is free software; you can redistribute it and/or +% modify it under the terms of the GNU General Public +% License as published by the Free Software Foundation; +% version 3 or later version of the License. +% +% This library is distributed in the hope that it will be useful, +% but WITHOUT ANY WARRANTY; without even the implied warranty of +% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +% Lesser General Public License for more details. +% +% You should have received a copy of the GNU General Public +% License along with this library; if not, write to the Free Software +% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +% + +અ1 +આ1 +ઇ1 +ઈ1 +ઉ1 +ઊ1 +ઋ1 +એ1 +ઐ1 +ઔ1 +ા1 +િ1 +ી1 +ુ1 +ૂ1 +ૃ1 +ે1 +ો1 +ૈ1 +ૌ1 +્2 +ઃ1 +ં1 +1ન +ન્2 +2ન્‍ +1ર +ર્2 +2ર્‍ +1લ +લ્2 +2લ્‍ +1ળ +ળ્2 +2ળ્‍ +1ણ +ણ્2 +2ણ્‍ +1ક +1ગ +1ખ +1ઘ +1ઙ +1ચ +1છ +1જ +1ઝ +1ઞ +1ટ +1ઠ +1ડ +1ઢ +1ત +1થ +1દ +1ધ +1પ +1ફ +1બ +1ભ +1મ +1ય +1વ +1શ +1ષ +1સ +1હ diff --git a/silpa/modules/hyphenator/rules/hyph_hi_IN.dic b/silpa/modules/hyphenator/rules/hyph_hi_IN.dic new file mode 100644 index 0000000..dc82fbd --- /dev/null +++ b/silpa/modules/hyphenator/rules/hyph_hi_IN.dic @@ -0,0 +1,92 @@ +UTF-8 +% Hyphenation for Hindi +% Copyright (C) 2008 Santhosh Thottingal +% +% This library is free software; you can redistribute it and/or +% modify it under the terms of the GNU General Public +% License as published by the Free Software Foundation; +% version 3 or later version of the License. +% +% This library is distributed in the hope that it will be useful, +% but WITHOUT ANY WARRANTY; without even the implied warranty of +% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +% Lesser General Public License for more details. +% +% You should have received a copy of the GNU General Public +% License along with this library; if not, write to the Free Software +% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +% + +अ1 +आ1 +इ1 +ई1 +उ1 +ऊ1 +ऋ1 +ऎ1 +ए1 +ऐ1 +ऒ1 +औ1 +ा1 +ि1 +ी1 +ु1 +ू1 +ृ1 +ॆ1 +े1 +ॊ1 +ो1 +ै1 +ौ1 +्2 +ः1 +ं1 +1न +न्2 +2न्‍ +1र +र्2 +2र्‍ +1ल +ल्2 +2ल्‍ +1ळ +ळ्2 +2ळ्‍ +1ण +ण्2 +2ण्‍ +1क +1ग +1ख +1घ +1ङ +1च +1छ +1ज +1झ +1ञ +1ट +1ठ +1ड +1ढ +1त +1थ +1द +1ध +1प +1फ +1ब +1भ +1म +1य +1व +1श +1ष +1स +1ह +1ऴ +1ऱ diff --git a/silpa/modules/hyphenator/rules/hyph_kn_IN.dic b/silpa/modules/hyphenator/rules/hyph_kn_IN.dic new file mode 100644 index 0000000..e241192 --- /dev/null +++ b/silpa/modules/hyphenator/rules/hyph_kn_IN.dic @@ -0,0 +1,91 @@ +UTF-8 +% Hyphenation for Kannada +% Copyright (C) 2008 Santhosh Thottingal +% +% This library is free software; you can redistribute it and/or +% modify it under the terms of the GNU General Public +% License as published by the Free Software Foundation; +% version 3 or later version of the License. +% +% This library is distributed in the hope that it will be useful, +% but WITHOUT ANY WARRANTY; without even the implied warranty of +% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +% Lesser General Public License for more details. +% +% You should have received a copy of the GNU General Public +% License along with this library; if not, write to the Free Software +% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +% + +ಅ1 +ಆ1 +ಇ1 +ಈ1 +ಉ1 +ಊ1 +ಋ1 +ಎ1 +ಏ1 +ಐ1 +ಒ1 +ಔ1 +ಾ1 +ಿ1 +ೀ1 +ು1 +ೂ1 +ೃ1 +ೆ1 +ೇ1 +ೊ1 +ೋ1 +ೈ1 +ೌ1 +್2 +ಃ1 +ಂ1 +1ನ +ನ್2 +2ನ್‍ +1ರ +ರ್2 +2ರ್‍ +1ಲ +ಲ್2 +2ಲ್‍ +1ಳ +ಳ್2 +2ಳ್‍ +1ಣ +ಣ್2 +2ಣ್‍ +1ಕ +1ಗ +1ಖ +1ಘ +1ಙ +1ಚ +1ಛ +1ಜ +1ಝ +1ಞ +1ಟ +1ಠ +1ಡ +1ಢ +1ತ +1ಥ +1ದ +1ಧ +1ಪ +1ಫ +1ಬ +1ಭ +1ಮ +1ಯ +1ವ +1ಶ +1ಷ +1ಸ +1ಹ +1ಱ diff --git a/silpa/modules/hyphenator/rules/hyph_ml_IN.dic b/silpa/modules/hyphenator/rules/hyph_ml_IN.dic new file mode 100644 index 0000000..44b50b9 --- /dev/null +++ b/silpa/modules/hyphenator/rules/hyph_ml_IN.dic @@ -0,0 +1,93 @@ +UTF-8 +% Hyphenation for Malayalam +% Copyright (C) 2008 Santhosh Thottingal +% +% This library is free software; you can redistribute it and/or +% modify it under the terms of the GNU General Public +% License as published by the Free Software Foundation; +% version 3 or later version of the License. +% +% This library is distributed in the hope that it will be useful, +% but WITHOUT ANY WARRANTY; without even the implied warranty of +% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +% Lesser General Public License for more details. +% +% You should have received a copy of the GNU General Public +% License along with this library; if not, write to the Free Software +% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +% + +അ1 +ആ1 +ഇ1 +ഈ1 +ഉ1 +ഊ1 +ഋ1 +എ1 +ഏ1 +ഐ1 +ഒ1 +ഔ1 +ാ1 +ി1 +ീ1 +ു1 +ൂ1 +ൃ1 +െ1 +േ1 +ൊ1 +ോ1 +ൈ1 +ൌ1 +ൗ1 +്2 +ഃ1 +2ം1 +1ന +ന്2 +2ന്‍ +1ര +ര്2 +2ര്‍ +1ല +ല്2 +2ല്‍ +1ള +ള്2 +2ള്‍ +1ണ +ണ്2 +2ണ്‍ +1ക +1ഗ +1ഖ +1ഘ +1ങ +1ച +1ഛ +1ജ +1ഝ +1ഞ +1ട +1ഠ +1ഡ +1ഢ +1ത +1ഥ +1ദ +1ധ +1പ +1ഫ +1ബ +1ഭ +1മ +1യ +1വ +1ശ +1ഷ +1സ +1ഹ +1ഴ +1റ diff --git a/silpa/modules/hyphenator/rules/hyph_or_IN.dic b/silpa/modules/hyphenator/rules/hyph_or_IN.dic new file mode 100644 index 0000000..c9ea024 --- /dev/null +++ b/silpa/modules/hyphenator/rules/hyph_or_IN.dic @@ -0,0 +1,85 @@ +UTF-8 +% Hyphenation for Oriya +% Copyright (C) 2008 Santhosh Thottingal +% +% This library is free software; you can redistribute it and/or +% modify it under the terms of the GNU General Public +% License as published by the Free Software Foundation; +% version 3 or later version of the License. +% +% This library is distributed in the hope that it will be useful, +% but WITHOUT ANY WARRANTY; without even the implied warranty of +% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +% Lesser General Public License for more details. +% +% You should have received a copy of the GNU General Public +% License along with this library; if not, write to the Free Software +% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +% + +ଅ1 +ଆ1 +ଇ1 +ଈ1 +ଉ1 +ଊ1 +ଋ1 +ଏ1 +ଐ1 +ଔ1 +ା1 +ି1 +ୀ1 +ୁ1 +େ1 +ୋ1 +ୈ1 +ୌ1 +ୗ1 +୍2 +ଃ1 +ଂ1 +1ନ +ନ୍2 +2ନ୍‍ +1ର +ର୍2 +2ର୍‍ +1ଲ +ଲ୍2 +2ଲ୍‍ +1ଳ +ଳ୍2 +2ଳ୍‍ +1ଣ +ଣ୍2 +2ଣ୍‍ +1କ +1ଗ +1ଖ +1ଘ +1ଙ +1ଚ +1ଛ +1ଜ +1ଝ +1ଞ +1ଟ +1ଠ +1ଡ +1ଢ +1ତ +1ଥ +1ଦ +1ଧ +1ପ +1ଫ +1ବ +1ଭ +1ମ +1ଯ +1ଵ +1ଶ +1ଷ +1ସ +1ହ diff --git a/silpa/modules/hyphenator/rules/hyph_pa_IN.dic b/silpa/modules/hyphenator/rules/hyph_pa_IN.dic new file mode 100644 index 0000000..fcda980 --- /dev/null +++ b/silpa/modules/hyphenator/rules/hyph_pa_IN.dic @@ -0,0 +1,83 @@ +UTF-8 +% Hyphenation for Panjabi(Gurmughi) +% Copyright (C) 2008 Santhosh Thottingal +% +% This library is free software; you can redistribute it and/or +% modify it under the terms of the GNU General Public +% License as published by the Free Software Foundation; +% version 3 or later version of the License. +% +% This library is distributed in the hope that it will be useful, +% but WITHOUT ANY WARRANTY; without even the implied warranty of +% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +% Lesser General Public License for more details. +% +% You should have received a copy of the GNU General Public +% License along with this library; if not, write to the Free Software +% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +% + +ਅ1 +ਆ1 +ਇ1 +ਈ1 +ਉ1 +ਊ1 +ਏ1 +ਐ1 +ਔ1 +ਾ1 +ਿ1 +ੀ1 +ੁ1 +ੂ1 +ੇ1 +ੋ1 +ੈ1 +ੌ1 +੍2 +ਃ1 +ਂ1 +1ਨ +ਨ੍2 +2ਨ੍‍ +1ਰ +ਰ੍2 +2ਰ੍‍ +1ਲ +ਲ੍2 +2ਲ੍‍ +1ਲ਼ +ਲ਼੍2 +2ਲ਼੍‍ +1ਣ +ਣ੍2 +2ਣ੍‍ +1ਕ +1ਗ +1ਖ +1ਘ +1ਙ +1ਚ +1ਛ +1ਜ +1ਝ +1ਞ +1ਟ +1ਠ +1ਡ +1ਢ +1ਤ +1ਥ +1ਦ +1ਧ +1ਪ +1ਫ +1ਬ +1ਭ +1ਮ +1ਯ +1ਵ +1ਸ਼ +1ਸ +1ਹ diff --git a/silpa/modules/hyphenator/rules/hyph_ta_IN.dic b/silpa/modules/hyphenator/rules/hyph_ta_IN.dic new file mode 100644 index 0000000..298d7d1 --- /dev/null +++ b/silpa/modules/hyphenator/rules/hyph_ta_IN.dic @@ -0,0 +1,77 @@ +UTF-8 +% Hyphenation for Tamil +% Copyright (C) 2008 Santhosh Thottingal +% +% This library is free software; you can redistribute it and/or +% modify it under the terms of the GNU General Public +% License as published by the Free Software Foundation; +% version 3 or later version of the License. +% +% This library is distributed in the hope that it will be useful, +% but WITHOUT ANY WARRANTY; without even the implied warranty of +% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +% Lesser General Public License for more details. +% +% You should have received a copy of the GNU General Public +% License along with this library; if not, write to the Free Software +% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +% + +அ1 +ஆ1 +இ1 +ஈ1 +உ1 +ஊ1 +எ1 +ஏ1 +ஐ1 +ஒ1 +ஔ1 +ா1 +ி1 +ீ1 +ு1 +ூ1 +ெ1 +ே1 +ொ1 +ோ1 +ை1 +ௌ1 +ௗ1 +்2 +ஃ1 +ஂ1 +1ந +ந்2 +2ந்‍ +1ர +ர்2 +2ர்‍ +1ல +ல்2 +2ல்‍ +1ள +ள்2 +2ள்‍ +1ண +ண்2 +2ண்‍ +1க +1ங +1ச +1ஜ +1ஞ +1ட +1த +1ப +1ம +1ய +1வ +1ஶ +1ஷ +1ஸ +1ஹ +1ழ +1ற diff --git a/silpa/modules/hyphenator/rules/hyph_te_IN.dic b/silpa/modules/hyphenator/rules/hyph_te_IN.dic new file mode 100644 index 0000000..62ddfe2 --- /dev/null +++ b/silpa/modules/hyphenator/rules/hyph_te_IN.dic @@ -0,0 +1,91 @@ +UTF-8 +% Hyphenation for Telugu +% Copyright (C) 2008 Santhosh Thottingal +% +% This library is free software; you can redistribute it and/or +% modify it under the terms of the GNU General Public +% License as published by the Free Software Foundation; +% version 3 or later version of the License. +% +% This library is distributed in the hope that it will be useful, +% but WITHOUT ANY WARRANTY; without even the implied warranty of +% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +% Lesser General Public License for more details. +% +% You should have received a copy of the GNU General Public +% License along with this library; if not, write to the Free Software +% Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +% + +అ1 +ఆ1 +ఇ1 +ఈ1 +ఉ1 +ఊ1 +ఋ1 +ఎ1 +ఏ1 +ఐ1 +ఒ1 +ఔ1 +ా1 +ి1 +ీ1 +ు1 +ూ1 +ృ1 +ె1 +ే1 +ొ1 +ో1 +ై1 +ౌ1 +్2 +ః1 +ం1 +1న +న్2 +2న్‍ +1ర +ర్2 +2ర్‍ +1ల +ల్2 +2ల్‍ +1ళ +ళ్2 +2ళ్‍ +1ణ +ణ్2 +2ణ్‍ +1క +1గ +1ఖ +1ఘ +1ఙ +1చ +1ఛ +1జ +1ఝ +1ఞ +1ట +1ఠ +1డ +1ఢ +1త +1థ +1ద +1ధ +1ప +1ఫ +1బ +1భ +1మ +1య +1వ +1శ +1ష +1స +1హ +1ఱ -- cgit