From 7c19f25ef4e8a18709eed13545d62c76fa299ce6 Mon Sep 17 00:00:00 2001 From: Santhosh Thottingal Date: Wed, 23 Sep 2009 21:31:03 +0530 Subject: Version 0.5 --- hyphenation/ChangeLog | 5 ++ hyphenation/hyph_as_IN.dic | 184 +++++++++++++++++------------------------- hyphenation/hyph_bn_IN.dic | 184 +++++++++++++++++------------------------- hyphenation/hyph_gu_IN.dic | 170 +++++++++++++++------------------------ hyphenation/hyph_hi_IN.dic | 179 ++++++++++++++++------------------------- hyphenation/hyph_kn_IN.dic | 186 +++++++++++++++++-------------------------- hyphenation/hyph_ml_IN.dic | 194 ++++++++++++++++++++------------------------- hyphenation/hyph_mr_IN.dic | 179 ++++++++++++++++------------------------- hyphenation/hyph_or_IN.dic | 167 +++++++++++++++----------------------- hyphenation/hyph_pa_IN.dic | 159 ++++++++++++++----------------------- hyphenation/hyph_ta_IN.dic | 122 ++++++++++++---------------- hyphenation/hyph_te_IN.dic | 184 +++++++++++++++++------------------------- 12 files changed, 761 insertions(+), 1152 deletions(-) diff --git a/hyphenation/ChangeLog b/hyphenation/ChangeLog index 41b0ad1..cf1cd46 100644 --- a/hyphenation/ChangeLog +++ b/hyphenation/ChangeLog @@ -1,5 +1,10 @@ ChangeLog -------------- +2009-08-22: Version 0.5 + * Fixed the bugs reported by Kevin for Malayalam + * For all patterns the problems with incompatibility between tex patterns and libhyphen of Openoffice fixed + * Added testcases for all languages. + 2009-08-18: Version 0.41 * Assamese hyphenation patters added. Copied from Bengali. diff --git a/hyphenation/hyph_as_IN.dic b/hyphenation/hyph_as_IN.dic index cf2a859..322d905 100755 --- a/hyphenation/hyph_as_IN.dic +++ b/hyphenation/hyph_as_IN.dic @@ -17,124 +17,84 @@ UTF-8 % Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA % % GENERAL RULE -% Do not break either side of ZERO-WIDTH JOINER -% (U+200D) and ZERO-WIDTH NON-JOINER (U+200C) +% Do not break either side of ZERO-WIDTH JOINER (U+200D) 2‍2 -2‌2 +% Break on both sides of ZERO-WIDTH NON JOINER (U+200C) +1‌1 % Break before or after any independent vowel. -1অ1 -1আ1 -1ই1 -1ঈ1 -1উ1 -1ঊ1 -1ঋ1 -1ৠ1 -1ঌ1 -1ৡ1 -1এ1 -1ঐ1 -1ও1 -1ঔ1 +অ1 +আ1 +ই1 +ঈ1 +উ1 +ঊ1 +ঋ1 +ৠ1 +ঌ1 +ৡ1 +এ1 +ঐ1 +ও1 +ঔ1 % Break after any dependent vowel, but not before. -2া1 -2ি1 -2ী1 -2ু1 -2ূ1 -2ৃ1 -2ৄ1 -2ৢ1 -2ৣ1 -2ে1 -2ৈ1 -2ো1 -2ৌ1 +া1 +ি1 +ী1 +ু1 +ূ1 +ৃ1 +ৄ1 +ৢ1 +ৣ1 +ে1 +ৈ1 +ো1 +ৌ1 +2়2 +ৗ1 % Break before or after any consonant. -1ক1 -1খ1 -1গ1 -1ঘ1 -1ঙ1 -1চ1 -1ছ1 -1জ1 -1ঝ1 -1ঞ1 -1ট1 -1ঠ1 -1ড1 -1ড়1 -1ঢ1 -1ঢ়1 -1ণ1 -1ত1 -1থ1 -1দ1 -1ধ1 -1ন1 -1প1 -1ফ1 -1ব1 -1ভ1 -1ম1 -1য1 -1য়1 -1র1 -1ল1 -1শ1 -1ষ1 -1স1 -1হ1 +1ক +1খ +1গ +1ঘ +1ঙ +1চ +1ছ +1জ +1ঝ +1ঞ +1ট +1ঠ +1ড +1ড় +1ঢ +1ঢ় +1ণ +1ত +1থ +1দ +1ধ +1ন +1প +1ফ +1ব +1ভ +1ম +1য +1য় +1র +1ল +1শ +1ষ +1স +1হ % Do not break after khanda ta. -1ৎ2 -% Do not break before a final consonant or conjunct. -2ক্. -2খ্. -2গ্. -2ঘ্. -2ঙ্. -2চ্. -2ছ্. -2জ্. -2ঝ্. -2ঞ্. -2ট্. -2ঠ্. -2ড্. -2ড়্. -2ঢ্. -2ঢ়্. -2ণ্. -2ত্. -2থ্. -2দ্. -2ধ্. -2ন্. -2প্. -2ফ্. -2ব্. -2ভ্. -2ম্. -2য্. -2য়্. -2র্. -2ল্. -2শ্. -2ষ্. -2স্. -2হ্. -2র্ক. -2র্ট. -2র্ত. -2র্প. +ৎ1 % Do not break before chandrabindu, anusvara, visarga, avagraha, % nukta and au length mark. -2ঁ -2ং -2ঃ -2ঽ -2় -2ৗ +2ঃ1 +2ং1 +2ঁ1 +2ঽ1 % Do not break either side of virama (may be within conjunct). 2্2 diff --git a/hyphenation/hyph_bn_IN.dic b/hyphenation/hyph_bn_IN.dic index 45ed3ba..a6842cc 100755 --- a/hyphenation/hyph_bn_IN.dic +++ b/hyphenation/hyph_bn_IN.dic @@ -17,124 +17,84 @@ UTF-8 % Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA % % GENERAL RULE -% Do not break either side of ZERO-WIDTH JOINER -% (U+200D) and ZERO-WIDTH NON-JOINER (U+200C) +% Do not break either side of ZERO-WIDTH JOINER (U+200D) 2‍2 -2‌2 +% Break on both sides of ZERO-WIDTH NON JOINER (U+200C) +1‌1 % Break before or after any independent vowel. -1অ1 -1আ1 -1ই1 -1ঈ1 -1উ1 -1ঊ1 -1ঋ1 -1ৠ1 -1ঌ1 -1ৡ1 -1এ1 -1ঐ1 -1ও1 -1ঔ1 +অ1 +আ1 +ই1 +ঈ1 +উ1 +ঊ1 +ঋ1 +ৠ1 +ঌ1 +ৡ1 +এ1 +ঐ1 +ও1 +ঔ1 % Break after any dependent vowel, but not before. -2া1 -2ি1 -2ী1 -2ু1 -2ূ1 -2ৃ1 -2ৄ1 -2ৢ1 -2ৣ1 -2ে1 -2ৈ1 -2ো1 -2ৌ1 +া1 +ি1 +ী1 +ু1 +ূ1 +ৃ1 +ৄ1 +ৢ1 +ৣ1 +ে1 +ৈ1 +ো1 +ৌ1 +2়2 +ৗ1 % Break before or after any consonant. -1ক1 -1খ1 -1গ1 -1ঘ1 -1ঙ1 -1চ1 -1ছ1 -1জ1 -1ঝ1 -1ঞ1 -1ট1 -1ঠ1 -1ড1 -1ড়1 -1ঢ1 -1ঢ়1 -1ণ1 -1ত1 -1থ1 -1দ1 -1ধ1 -1ন1 -1প1 -1ফ1 -1ব1 -1ভ1 -1ম1 -1য1 -1য়1 -1র1 -1ল1 -1শ1 -1ষ1 -1স1 -1হ1 +1ক +1খ +1গ +1ঘ +1ঙ +1চ +1ছ +1জ +1ঝ +1ঞ +1ট +1ঠ +1ড +1ড় +1ঢ +1ঢ় +1ণ +1ত +1থ +1দ +1ধ +1ন +1প +1ফ +1ব +1ভ +1ম +1য +1য় +1র +1ল +1শ +1ষ +1স +1হ % Do not break after khanda ta. -1ৎ2 -% Do not break before a final consonant or conjunct. -2ক্. -2খ্. -2গ্. -2ঘ্. -2ঙ্. -2চ্. -2ছ্. -2জ্. -2ঝ্. -2ঞ্. -2ট্. -2ঠ্. -2ড্. -2ড়্. -2ঢ্. -2ঢ়্. -2ণ্. -2ত্. -2থ্. -2দ্. -2ধ্. -2ন্. -2প্. -2ফ্. -2ব্. -2ভ্. -2ম্. -2য্. -2য়্. -2র্. -2ল্. -2শ্. -2ষ্. -2স্. -2হ্. -2র্ক. -2র্ট. -2র্ত. -2র্প. +ৎ1 % Do not break before chandrabindu, anusvara, visarga, avagraha, % nukta and au length mark. -2ঁ -2ং -2ঃ -2ঽ -2় -2ৗ +2ঃ1 +2ং1 +2ঁ1 +2ঽ1 % Do not break either side of virama (may be within conjunct). 2্2 diff --git a/hyphenation/hyph_gu_IN.dic b/hyphenation/hyph_gu_IN.dic index d42149f..9b0b80c 100755 --- a/hyphenation/hyph_gu_IN.dic +++ b/hyphenation/hyph_gu_IN.dic @@ -17,115 +17,77 @@ UTF-8 % Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA % % GENERAL RULE -% Do not break either side of ZERO-WIDTH JOINER -% (U+200D) and ZERO-WIDTH NON-JOINER (U+200C) +% Do not break either side of ZERO-WIDTH JOINER (U+200D) 2‍2 -2‌2 +% Break on both sides of ZERO-WIDTH NON JOINER (U+200C) +1‌1 % Break before or after any independent vowel. -1અ1 -1આ1 -1ઇ1 -1ઈ1 -1ઉ1 -1ઊ1 -1ઋ1 -1ૠ1 -1એ1 -1ઐ1 -1ઓ1 -1ઔ1 +અ1 +આ1 +ઇ1 +ઈ1 +ઉ1 +ઊ1 +ઋ1 +ૠ1 +એ1 +ઐ1 +ઓ1 +ઔ1 % Break after any dependent vowel but not before. -2ા1 -2િ1 -2ી1 -2ુ1 -2ૂ1 -2ૃ1 -2ૄ1 -2ૢ1 -2ૣ1 -2ે1 -2ૈ1 -2ો1 -2ૌ1 +ા1 +િ1 +ી1 +ુ1 +ૂ1 +ૃ1 +ૄ1 +ૢ1 +ૣ1 +ે1 +ૈ1 +ો1 +ૌ1 % Break before or after any consonant. -1ક1 -1ખ1 -1ગ1 -1ઘ1 -1ઙ1 -1ચ1 -1છ1 -1જ1 -1ઝ1 -1ઞ1 -1ટ1 -1ઠ1 -1ડ1 -1ઢ1 -1ણ1 -1ત1 -1થ1 -1દ1 -1ધ1 -1ન1 -1પ1 -1ફ1 -1બ1 -1ભ1 -1મ1 -1ય1 -1ર1 -1લ1 -1ળ1 -1વ1 -1શ1 -1ષ1 -1સ1 -1હ1 -% Do not break before a final consonant or conjunct. -2ક્. -2ખ્. -2ગ્. -2ઘ્. -2ઙ્. -2ચ્. -2છ્. -2જ્. -2ઝ્. -2ઞ્. -2ટ્. -2ઠ્. -2ડ્. -2ઢ્. -2ણ્. -2ત્. -2થ્. -2દ્. -2ધ્. -2ન્. -2પ્. -2ફ્. -2બ્. -2ભ્. -2મ્. -2ય્. -2ર્. -2લ્. -2ળ્. -2વ્. -2શ્. -2ષ્. -2સ્. -2હ્. -2ર્ક્. -2ર્ટ્. -2ર્ત્. -2ર્પ્. +1ક +1ખ +1ગ +1ઘ +1ઙ +1ચ +1છ +1જ +1ઝ +1ઞ +1ટ +1ઠ +1ડ +1ઢ +1ણ +1ત +1થ +1દ +1ધ +1ન +1પ +1ફ +1બ +1ભ +1મ +1ય +1ર +1લ +1ળ +1વ +1શ +1ષ +1સ +1હ % Do not break before chandrabindu, anusvara, visarga, avagraha % and accents. -2ઁ -2ઃ -2ઽ +2ઁ1 +2ઃ1 +2ઽ1 % Do not break either side of virama (may be within conjunct). 2્2 +2ં2 diff --git a/hyphenation/hyph_hi_IN.dic b/hyphenation/hyph_hi_IN.dic index 985eeaf..a0c7518 100755 --- a/hyphenation/hyph_hi_IN.dic +++ b/hyphenation/hyph_hi_IN.dic @@ -17,120 +17,81 @@ UTF-8 % Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA % % GENERAL RULE -% Do not break either side of ZERO-WIDTH JOINER -% (U+200D) and ZERO-WIDTH NON-JOINER (U+200C) +% Do not break either side of ZERO-WIDTH JOINER (U+200D) 2‍2 -2‌2 +% Break on both sides of ZERO-WIDTH NON JOINER (U+200C) +1‌1 % Break before or after any independent vowel. -1अ1 -1आ1 -1इ1 -1ई1 -1उ1 -1ऊ1 -1ऋ1 -1ॠ1 -1ऌ1 -1ॡ1 -1ए1 -1ऐ1 -1ओ1 -1औ1 +अ1 +आ1 +इ1 +ई1 +उ1 +ऊ1 +ऋ1 +ॠ1 +ऌ1 +ॡ1 +ए1 +ऐ1 +ओ1 +औ1 % Break after any dependent vowel but not before. -2ा1 -2ि1 -2ी1 -2ु1 -2ू1 -2ृ1 -2ॄ1 -2ॢ1 -2ॣ1 -2े1 -2ै1 -2ो1 -2ौ1 +ा1 +ि1 +ी1 +ु1 +ू1 +ृ1 +ॄ1 +ॢ1 +ॣ1 +े1 +ै1 +ो1 +ौ1 % Break before or after any consonant. -1क1 -1ख1 -1ग1 -1घ1 -1ङ1 -1च1 -1छ1 -1ज1 -1झ1 -1ञ1 -1ट1 -1ठ1 -1ड1 -1ढ1 -1ण1 -1त1 -1थ1 -1द1 -1ध1 -1न1 -1प1 -1फ1 -1ब1 -1भ1 -1म1 -1य1 -1र1 -1ल1 -1ळ1 -1व1 -1श1 -1ष1 -1स1 -1ह1 -% Do not break before a final consonant or conjunct. -2क्. -2ख्. -2ग्. -2घ्. -2ङ्. -2च्. -2छ्. -2ज्. -2झ्. -2ञ्. -2ट्. -2ठ्. -2ड्. -2ढ्. -2ण्. -2त्. -2थ्. -2द्. -2ध्. -2न्. -2प्. -2फ्. -2ब्. -2भ्. -2म्. -2य्. -2र्. -2ल्. -2ळ्. -2व्. -2श्. -2ष्. -2स्. -2ह्. -2र्क्. -2र्ट्. -2र्त्. -2र्प्. +1क +1ख +1ग +1घ +1ङ +1च +1छ +1ज +1झ +1ञ +1ट +1ठ +1ड +1ढ +1ण +1त +1थ +1द +1ध +1न +1प +1फ +1ब +1भ +1म +1य +1र +1ल +1ळ +1व +1श +1ष +1स +1ह % Do not break before chandrabindu, anusvara, visarga, avagraha % and accents. -2ँ -2ं -2ः -2ऽ -2॑ -2॒ +2ँ1 +2ं1 +2ः1 +2ऽ1 +2॑1 +2॒1 % Do not break either side of virama (may be within conjunct). 2्2 diff --git a/hyphenation/hyph_kn_IN.dic b/hyphenation/hyph_kn_IN.dic index ebd0b04..fa358c3 100755 --- a/hyphenation/hyph_kn_IN.dic +++ b/hyphenation/hyph_kn_IN.dic @@ -17,124 +17,84 @@ UTF-8 % Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA % % GENERAL RULE -% Do not break either side of ZERO-WIDTH JOINER -% (U+200D) and ZERO-WIDTH NON-JOINER (U+200C) +% Do not break either side of ZERO-WIDTH JOINER (U+200D) 2‍2 -2‌2 +% Break on both sides of ZERO-WIDTH NON JOINER (U+200C) +1‌1 % Break before or after any independent vowel. -1ಅ1 -1ಆ1 -1ಇ1 -1ಈ1 -1ಉ1 -1ಊ1 -1ಋ1 -1ೠ1 -1ಌ1 -1ೡ1 -1ಎ1 -1ಏ1 -1ಐ1 -1ಒ1 -1ಓ1 -1ಔ1 +ಅ1 +ಆ1 +ಇ1 +ಈ1 +ಉ1 +ಊ1 +ಋ1 +ೠ1 +ಌ1 +ೡ1 +ಎ1 +ಏ1 +ಐ1 +ಒ1 +ಓ1 +ಔ1 % Break after any dependent vowel, but not before. -2ಾ1 -2ಿ1 -2ೀ1 -2ು1 -2ೂ1 -2ೃ1 -2ೄ1 -2ೆ1 -2ೇ1 -2ೈ1 -2ೊ1 -2ೋ1 -2ೌ1 +ಾ1 +ಿ1 +ೀ1 +ು1 +ೂ1 +ೃ1 +ೄ1 +ೆ1 +ೇ1 +ೈ1 +ೊ1 +ೋ1 +ೌ1 % Break before or after any consonant. -1ಕ1 -1ಖ1 -1ಗ1 -1ಘ1 -1ಙ1 -1ಚ1 -1ಛ1 -1ಜ1 -1ಝ1 -1ಞ1 -1ಟ1 -1ಠ1 -1ಡ1 -1ಢ1 -1ಣ1 -1ತ1 -1ಥ1 -1ದ1 -1ಧ1 -1ನ1 -1ಪ1 -1ಫ1 -1ಬ1 -1ಭ1 -1ಮ1 -1ಯ1 -1ರ1 -1ಱ1 % can occur in Sanskrit? -1ಲ1 -1ಳ1 -1ೞ1 % can occur in Sanskrit? -1ವ1 -1ಶ1 -1ಷ1 -1ಸ1 -1ಹ1 -% Do not break before a final consonant or conjunct. -2ಕ್. -2ಖ್. -2ಗ್. -2ಘ್. -2ಙ್. -2ಚ್. -2ಛ್. -2ಜ್. -2ಝ್. -2ಞ್. -2ಟ್. -2ಠ್. -2ಡ್. -2ಢ್. -2ಣ್. -2ತ್. -2ಥ್. -2ದ್. -2ಧ್. -2ನ್. -2ಪ್. -2ಫ್. -2ಬ್. -2ಭ್. -2ಮ್. -2ಯ್. -2ರ್. -2ಱ್. -2ಲ್. -2ಳ್. -2ವ್. -2ಶ್. -2ಷ್. -2ಸ್. -2ಹ್. -2ರ್ಕ. -2ರ್ಟ. -2ರ್ತ. -2ರ್ಪ. +1ಕ +1ಖ +1ಗ +1ಘ +1ಙ +1ಚ +1ಛ +1ಜ +1ಝ +1ಞ +1ಟ +1ಠ +1ಡ +1ಢ +1ಣ +1ತ +1ಥ +1ದ +1ಧ +1ನ +1ಪ +1ಫ +1ಬ +1ಭ +1ಮ +1ಯ +1ರ +1ಱ +1ಲ +1ಳ +1ೞ +1ವ +1ಶ +1ಷ +1ಸ +1ಹ % Do not break before anusvara, visarga, avagraha, % length mark and ai length mark. -2ಂ -2ಃ -2ಽ -2ೕ -2ೖ +2ಂ1 +2ಃ1 +2ಽ1 +2ೕ1 +2ೖ1 % Do not break either side of virama (may be within conjunct). 2್2 diff --git a/hyphenation/hyph_ml_IN.dic b/hyphenation/hyph_ml_IN.dic index 5836fe4..d33a26a 100755 --- a/hyphenation/hyph_ml_IN.dic +++ b/hyphenation/hyph_ml_IN.dic @@ -17,125 +17,99 @@ UTF-8 % Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA % % GENERAL RULE -% Do not break either side of ZERO-WIDTH JOINER -% (U+200D) and ZERO-WIDTH NON-JOINER (U+200C) +% Do not break either side of ZERO-WIDTH JOINER (U+200D) 2‍2 -2‌2 +% Break on both sides of ZERO-WIDTH NON JOINER (U+200C) +1‌1 % Break before or after any independent vowel. -1അ1 -1ആ1 -1ഇ1 -1ഈ1 -1ഉ1 -1ഊ1 -1ഋ1 -1ൠ1 -1ഌ1 -1ൡ1 -1എ1 -1ഏ1 -1ഐ1 -1ഒ1 -1ഓ1 -1ഔ1 +അ1 +ആ1 +ഇ1 +ഈ1 +ഉ1 +ഊ1 +ഋ1 +ൠ1 +ഌ1 +ൡ1 +എ1 +ഏ1 +ഐ1 +ഒ1 +ഓ1 +ഔ1 % Break after any dependent vowel, but not before. -2ാ1 -2ി1 -2ീ1 -2ു1 -2ൂ1 -2ൃ1 -2െ1 -2േ1 -2ൈ1 -2ൊ1 -2ോ1 -2ൌ1 +ാ1 +ി1 +ീ1 +ു1 +ൂ1 +ൃ1 +െ1 +േ1 +ൈ1 +ൊ1 +ോ1 +ൌ1 +ൗ1 % Break before or after any consonant. -1ക1 -1ഖ1 -1ഗ1 -1ഘ1 -1ങ1 -1ച1 -1ഛ1 -1ജ1 -1ഝ1 -1ഞ1 -1ട1 -1ഠ1 -1ഡ1 -1ഢ1 -1ണ1 -1ത1 -1ഥ1 -1ദ1 -1ധ1 -1ന1 -1പ1 -1ഫ1 -1ബ1 -1ഭ1 -1മ1 -1യ1 -1ര1 -1റ1 -1ല1 -1ള1 -1ഴ1 -1വ1 -1ശ1 -1ഷ1 -1സ1 -1ഹ1 -% Do not break before a final consonant or conjunct. -2ക്. -2ഖ്. -2ഗ്. -2ഘ്. -2ങ്. -2ച്. -2ഛ്. -2ജ്. -2ഝ്. -2ഞ്. -2ട്. -2ഠ്. -2ഡ്. -2ഢ്. -2ണ്. -2ത്. -2ഥ്. -2ദ്. -2ധ്. -2ന്. -2പ്. -2ഫ്. -2ബ്. -2ഭ്. -2മ്. -2യ്. -2ര്. -2റ്. -2ല്. -2ള്. -2ഴ്. -2വ്. -2ശ്. -2ഷ്. -2സ്. -2ഹ്. -% Do not break before anusvara, visarga and length mark. -2ം -2ഃ -2ൗ +1ക +1ഖ +1ഗ +1ഘ +1ങ +1ച +1ഛ +1ജ +1ഝ +1ഞ +1ട +1ഠ +1ഡ +1ഢ +1ണ +1ത +1ഥ +1ദ +1ധ +1ന +1പ +1ഫ +1ബ +1ഭ +1മ +1യ +1ര +1റ +1ല +1ള +1ഴ +1വ +1ശ +1ഷ +1സ +1ഹ +% Do not break before anusvara, visarga +2ഃ1 +2ം1 % Do not break either side of virama (may be within conjunct). 2്2 % Do not break left side of chillu +ന്2 +ര്2 +ള്2 +ല്2 +ക്2 +ണ്2 +2ന്‍ 2ല്‍ 2ള്‍ -2ന്‍ 2ണ്‍ 2ര്‍ 2ക്‍ - +2ൺ +2ൻ +2ർ +2ൽ +2ൾ +2ൿ diff --git a/hyphenation/hyph_mr_IN.dic b/hyphenation/hyph_mr_IN.dic index e0eb801..3e98bfa 100755 --- a/hyphenation/hyph_mr_IN.dic +++ b/hyphenation/hyph_mr_IN.dic @@ -17,120 +17,81 @@ UTF-8 % Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA % % GENERAL RULE -% Do not break either side of ZERO-WIDTH JOINER -% (U+200D) and ZERO-WIDTH NON-JOINER (U+200C) +% Do not break either side of ZERO-WIDTH JOINER (U+200D) 2‍2 -2‌2 +% Break on both sides of ZERO-WIDTH NON JOINER (U+200C) +1‌1 % Break before or after any independent vowel. -1अ1 -1आ1 -1इ1 -1ई1 -1उ1 -1ऊ1 -1ऋ1 -1ॠ1 -1ऌ1 -1ॡ1 -1ए1 -1ऐ1 -1ओ1 -1औ1 +अ1 +आ1 +इ1 +ई1 +उ1 +ऊ1 +ऋ1 +ॠ1 +ऌ1 +ॡ1 +ए1 +ऐ1 +ओ1 +औ1 % Break after any dependent vowel but not before. -2ा1 -2ि1 -2ी1 -2ु1 -2ू1 -2ृ1 -2ॄ1 -2ॢ1 -2ॣ1 -2े1 -2ै1 -2ो1 -2ौ1 +ा1 +ि1 +ी1 +ु1 +ू1 +ृ1 +ॄ1 +ॢ1 +ॣ1 +े1 +ै1 +ो1 +ौ1 % Break before or after any consonant. -1क1 -1ख1 -1ग1 -1घ1 -1ङ1 -1च1 -1छ1 -1ज1 -1झ1 -1ञ1 -1ट1 -1ठ1 -1ड1 -1ढ1 -1ण1 -1त1 -1थ1 -1द1 -1ध1 -1न1 -1प1 -1फ1 -1ब1 -1भ1 -1म1 -1य1 -1र1 -1ल1 -1ळ1 -1व1 -1श1 -1ष1 -1स1 -1ह1 -% Do not break before a final consonant or conjunct. -2क्. -2ख्. -2ग्. -2घ्. -2ङ्. -2च्. -2छ्. -2ज्. -2झ्. -2ञ्. -2ट्. -2ठ्. -2ड्. -2ढ्. -2ण्. -2त्. -2थ्. -2द्. -2ध्. -2न्. -2प्. -2फ्. -2ब्. -2भ्. -2म्. -2य्. -2र्. -2ल्. -2ळ्. -2व्. -2श्. -2ष्. -2स्. -2ह्. -2र्क्. -2र्ट्. -2र्त्. -2र्प्. +1क +1ख +1ग +1घ +1ङ +1च +1छ +1ज +1झ +1ञ +1ट +1ठ +1ड +1ढ +1ण +1त +1थ +1द +1ध +1न +1प +1फ +1ब +1भ +1म +1य +1र +1ल +1ळ +1व +1श +1ष +1स +1ह % Do not break before chandrabindu, anusvara, visarga, avagraha % and accents. -2ँ -2ं -2ः -2ऽ -2॑ -2॒ +2ँ1 +2ं1 +2ः1 +2ऽ1 +2॑1 +2॒1 % Do not break either side of virama (may be within conjunct). 2्2 diff --git a/hyphenation/hyph_or_IN.dic b/hyphenation/hyph_or_IN.dic index 09e1fbf..7d73740 100755 --- a/hyphenation/hyph_or_IN.dic +++ b/hyphenation/hyph_or_IN.dic @@ -17,111 +17,76 @@ UTF-8 % Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA % % GENERAL RULE -% Do not break either side of ZERO-WIDTH JOINER -% (U+200D) and ZERO-WIDTH NON-JOINER (U+200C) +% Do not break either side of ZERO-WIDTH JOINER (U+200D) 2‍2 -2‌2 +% Break on both sides of ZERO-WIDTH NON JOINER (U+200C) +1‌1 % Break before or after any independent vowel. -1ଅ1 -1ଆ1 -1ଇ1 -1ଈ1 -1ଉ1 -1ଊ1 -1ଋ1 -1ୠ1 -1ଌ1 -1ୡ1 -1ଏ1 -1ଐ1 -1ଓ1 -1ଔ1 +ଅ1 +ଆ1 +ଇ1 +ଈ1 +ଉ1 +ଊ1 +ଋ1 +ୠ1 +ଌ1 +ୡ1 +ଏ1 +ଐ1 +ଓ1 +ଔ1 % Break after any dependent vowel, but not before. -2ା1 -2ି1 -2ୀ1 -2ୁ1 -2ୂ1 -2ୃ1 -2େ1 -2ୈ1 -2ୋ1 -2ୌ1 +ା1 +ି1 +ୀ1 +ୁ1 +ୂ1 +ୃ1 +େ1 +ୈ1 +ୋ1 +ୌ1 % Break before or after any consonant. -1କ1 -1ଖ1 -1ଗ1 -1ଘ1 -1ଙ1 -1ଚ1 -1ଛ1 -1ଜ1 -1ଝ1 -1ଞ1 -1ଟ1 -1ଠ1 -1ଡ1 -1ଢ1 -1ଣ1 -1ତ1 -1ଥ1 -1ଦ1 -1ଧ1 -1ନ1 -1ପ1 -1ଫ1 -1ବ1 -1ଭ1 -1ମ1 -1ଯ1 -1ର1 -1ଲ1 -1ଳ1 -1ଵ1 -1ଶ1 -1ଷ1 -1ସ1 -1ହ1 -% Do not break before a final consonant or conjunct. -2କ୍. -2ଖ୍. -2ଗ୍. -2ଘ୍. -2ଙ୍. -2ଚ୍. -2ଛ୍. -2ଜ୍. -2ଝ୍. -2ଞ୍. -2ଟ୍. -2ଠ୍. -2ଡ୍. -2ଢ୍. -2ଣ୍. -2ତ୍. -2ଥ୍. -2ଦ୍. -2ଧ୍. -2ନ୍. -2ପ୍. -2ଫ୍. -2ବ୍. -2ଭ୍. -2ମ୍. -2ଯ୍. -2ର୍. -2୍. -2ଲ୍. -2ଳ୍. -2୍. -2ଵ୍. -2ଶ୍. -2ଷ୍. -2ସ୍. -2ହ୍. +1କ +1ଖ +1ଗ +1ଘ +1ଙ +1ଚ +1ଛ +1ଜ +1ଝ +1ଞ +1ଟ +1ଠ +1ଡ +1ଢ +1ଣ +1ତ +1ଥ +1ଦ +1ଧ +1ନ +1ପ +1ଫ +1ବ +1ଭ +1ମ +1ଯ +1ର +1ଲ +1ଳ +1ଵ +1ଶ +1ଷ +1ସ +1ହ % Do not break before anusvara, visarga and length mark. -2ଂ -2ଃ -2ୗ +2ଂ1 +2ଃ1 +2ୗ1 +2ଁ1 % Do not break either side of virama (may be within conjunct). 2୍2 + diff --git a/hyphenation/hyph_pa_IN.dic b/hyphenation/hyph_pa_IN.dic index 14211fe..f7643c4 100755 --- a/hyphenation/hyph_pa_IN.dic +++ b/hyphenation/hyph_pa_IN.dic @@ -17,109 +17,72 @@ UTF-8 % Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA % % GENERAL RULE -% Do not break either side of ZERO-WIDTH JOINER -% (U+200D) and ZERO-WIDTH NON-JOINER (U+200C) +% GENERAL RULE +% Do not break either side of ZERO-WIDTH JOINER (U+200D) 2‍2 -2‌2 +% Break on both sides of ZERO-WIDTH NON JOINER (U+200C) +1‌1 % Break before or after any independent vowel. -1ਅ1 -1ਆ1 -1ਇ1 -1ਈ1 -1ਉ1 -1ਊ1 -1ਏ1 -1ਐ1 -1ਓ1 -1ਔ1 +ਅ1 +ਆ1 +ਇ1 +ਈ1 +ਉ1 +ਊ1 +ਏ1 +ਐ1 +ਓ1 +ਔ1 % Break after any dependent vowel but not before. -2ਾ1 -2ਿ1 -2ੀ1 -2ੁ1 -2ੂ1 -2ੇ1 -2ੈ1 -2ੋ1 -2ੌ1 +ਾ1 +ਿ1 +ੀ1 +ੁ1 +ੂ1 +ੇ1 +ੈ1 +ੋ1 +ੌ1 % Break before or after any consonant. -1ਕ1 -1ਖ1 -1ਗ1 -1ਘ1 -1ਙ1 -1ਚ1 -1ਛ1 -1ਜ1 -1ਝ1 -1ਞ1 -1ਟ1 -1ਠ1 -1ਡ1 -1ਢ1 -1ਣ1 -1ਤ1 -1ਥ1 -1ਦ1 -1ਧ1 -1ਨ1 -1ਪ1 -1ਫ1 -1ਬ1 -1ਭ1 -1ਮ1 -1ਯ1 -1ਰ1 -1ਲ1 -1ਲ਼1 -1ਵ1 -1ਸ਼1 -11 -1ਸ1 -1ਹ1 -% Do not break before a final consonant or conjunct. -2ਕ੍. -2ਖ੍. -2ਗ੍. -2ਘ੍. -2ਙ੍. -2ਚ੍. -2ਛ੍. -2ਜ੍. -2ਝ੍. -2ਞ੍. -2ਟ੍. -2ਠ੍. -2ਡ੍. -2ਢ੍. -2ਣ੍. -2ਤ੍. -2ਥ੍. -2ਦ੍. -2ਧ੍. -2ਨ੍. -2ਪ੍. -2ਫ੍. -2ਬ੍. -2ਭ੍. -2ਮ੍. -2ਯ੍. -2ਰ੍. -2ਲ੍. -2ਲ਼੍. -2ਵ੍. -2ਸ਼੍. -2੍. -2ਸ੍. -2ਹ੍. -2ਰ੍ਕ੍. -2ਰ੍ਟ੍. -2ਰ੍ਤ੍. -2ਰ੍ਪ੍. +1ਕ +1ਖ +1ਗ +1ਘ +1ਙ +1ਚ +1ਛ +1ਜ +1ਝ +1ਞ +1ਟ +1ਠ +1ਡ +1ਢ +1ਣ +1ਤ +1ਥ +1ਦ +1ਧ +1ਨ +1ਪ +1ਫ +1ਬ +1ਭ +1ਮ +1ਯ +1ਰ +1ਲ +1ਲ਼ +1ਵ +1ਸ਼ +1ਸ +1ਹ % Do not break before chandrabindu, anusvara, visarga, avagraha % and accents. -2ਁ -2ਂ -2ਃ +2ਁ1 +2ਂ1 +2ਃ1 % Do not break either side of virama (may be within conjunct). 2੍2 +2ੰ2 +2ੱ2 diff --git a/hyphenation/hyph_ta_IN.dic b/hyphenation/hyph_ta_IN.dic index 9a5c889..65bf2fa 100755 --- a/hyphenation/hyph_ta_IN.dic +++ b/hyphenation/hyph_ta_IN.dic @@ -17,82 +17,60 @@ UTF-8 % Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA % % GENERAL RULE -% Do not break either side of ZERO-WIDTH JOINER -% (U+200D) and ZERO-WIDTH NON-JOINER (U+200C) +% Do not break either side of ZERO-WIDTH JOINER (U+200D) 2‍2 -2‌2 +% Break on both sides of ZERO-WIDTH NON JOINER (U+200C) +1‌1 % Break before or after any independent vowel. -1அ1 -1ஆ1 -1இ1 -1ஈ1 -1உ1 -1ஊ1 -1எ1 -1ஏ1 -1ஐ1 -1ஒ1 -1ஓ1 -1ஔ1 +அ1 +ஆ1 +இ1 +ஈ1 +உ1 +ஊ1 +எ1 +ஏ1 +ஐ1 +ஒ1 +ஓ1 +ஔ1 % Break after any dependent vowel, but not before. -2ா1 -2ி1 -2ீ1 -2ு1 -2ூ1 -2ெ1 -2ே1 -2ை1 -2ொ1 -2ோ1 -2ௌ1 +ா1 +ி1 +ீ1 +ு1 +ூ1 +ெ1 +ே1 +ை1 +ொ1 +ோ1 +ௌ1 % Break before or after any consonant. -1க1 -1ங1 -1ச1 -1ஜ1 -1ஞ1 -1ட1 -1ண1 -1த1 -1ந1 -1ப1 -1ம1 -1ய1 -1ர1 -1ற1 -1ல1 -1ள1 -1ழ1 -1வ1 -1ஷ1 -1ஸ1 -1ஹ1 -% Do not break before a final consonant or conjunct. -2க். -2ங். -2ச். -2ஜ். -2ஞ். -2ட். -2ண். -2த். -2ந். -2ப். -2ம். -2ய். -2ர். -2ற். -2ல். -2ள். -2ழ். -2வ். -2ஷ். -2ஸ். -2ஹ். +1க +1ங +1ச +1ஜ +1ஞ +1ட +1ண +1த +1ந +1ப +1ம +1ய +1ர +1ற +1ல +1ள +1ழ +1வ +1ஷ +1ஸ +1ஹ % Do not break before anusvara, visarga and length mark. -2ஂ -2ஃ -2ௗ +2ஂ1 +2ஃ1 +2ௗ1 % Do not break either side of virama (may be within conjunct). 2்2 diff --git a/hyphenation/hyph_te_IN.dic b/hyphenation/hyph_te_IN.dic index 8e4b725..ef3ca2e 100755 --- a/hyphenation/hyph_te_IN.dic +++ b/hyphenation/hyph_te_IN.dic @@ -17,123 +17,83 @@ UTF-8 % Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA % % GENERAL RULE -% Do not break either side of ZERO-WIDTH JOINER -% (U+200D) and ZERO-WIDTH NON-JOINER (U+200C) +% Do not break either side of ZERO-WIDTH JOINER (U+200D) 2‍2 -2‌2 +% Break on both sides of ZERO-WIDTH NON JOINER (U+200C) +1‌1 % Break before or after any independent vowel. -1అ1 -1ఆ1 -1ఇ1 -1ఈ1 -1ఉ1 -1ఊ1 -1ఋ1 -1ౠ1 -1ఌ1 -1ౡ1 -1ఎ1 -1ఏ1 -1ఐ1 -1ఒ1 -1ఓ1 -1ఔ1 +అ1 +ఆ1 +ఇ1 +ఈ1 +ఉ1 +ఊ1 +ఋ1 +ౠ1 +ఌ1 +ౡ1 +ఎ1 +ఏ1 +ఐ1 +ఒ1 +ఓ1 +ఔ1 % Break after any dependent vowel, but not before. -2ా1 -2ి1 -2ీ1 -2ు1 -2ూ1 -2ృ1 -2ౄ1 -2ె1 -2ే1 -2ై1 -2ొ1 -2ో1 -2ౌ1 +ా1 +ి1 +ీ1 +ు1 +ూ1 +ృ1 +ౄ1 +ె1 +ే1 +ై1 +ొ1 +ో1 +ౌ1 % Break before or after any consonant. -1క1 -1ఖ1 -1గ1 -1ఘ1 -1ఙ1 -1చ1 -1ఛ1 -1జ1 -1ఝ1 -1ఞ1 -1ట1 -1ఠ1 -1డ1 -1ఢ1 -1ణ1 -1త1 -1థ1 -1ద1 -1ధ1 -1న1 -1ప1 -1ఫ1 -1బ1 -1భ1 -1మ1 -1య1 -1ర1 -1ఱ1 % can occur in Sanskrit? -1ల1 -1ళ1 -1వ1 -1శ1 -1ష1 -1స1 -1హ1 -% Do not break before a final consonant or conjunct. -2క్. -2ఖ్. -2గ్. -2ఘ్. -2ఙ్. -2చ్. -2ఛ్. -2జ్. -2ఝ్. -2ఞ్. -2ట్. -2ఠ్. -2డ్. -2ఢ్. -2ణ్. -2త్. -2థ్. -2ద్. -2ధ్. -2న్. -2ప్. -2ఫ్. -2బ్. -2భ్. -2మ్. -2య్. -2ర్. -2ఱ్. -2ల్. -2ళ్. -2వ్. -2శ్. -2ష్. -2స్. -2హ్. -2ర్క్. -2ర్ట్. -2ర్త్. -2ర్ప్. +1క +1ఖ +1గ +1ఘ +1ఙ +1చ +1ఛ +1జ +1ఝ +1ఞ +1ట +1ఠ +1డ +1ఢ +1ణ +1త +1థ +1ద +1ధ +1న +1ప +1ఫ +1బ +1భ +1మ +1య +1ర +1ఱ +1ల +1ళ +1వ +1శ +1ష +1స +1హ % Do not break before chandrabindu, anusvara, visarga, % length mark and ai length mark. -2ఁ -2ం -2ః -2ౕ -2ౖ +2ఁ1 +2ం1 +2ః1 +2ౕ1 +2ౖ1 % Do not break either side of virama (may be within conjunct). 2్2 -- cgit