%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%
%  File name: sanhyph.tex
%
%  Unicode hyphenation patterns for Sanskrit and Prakrit in Devanagari,
%  Bengali, Kannada, Malayalam and Telugu scripts.
%
%  Created:       April 1st, 2005
%  First release: June 8th, 2006
%  Revised:
%  Version:       0.1
%
%  Created by Yves Codet with Jonathan Kew's help.
%
%  These patterns are meant for XeTeX, a Unicode variant of TeX.
%
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

\message{Sanskrit hyphenation patterns `sanhyph.tex' (v0.1) <2005/4/1>}

% Set \lccode for combining marks.
%
% TeX only hyphenates runs of characters whose \lccode is non-zero, and
% \patterns only accepts such characters.  Each combining mark used in
% the patterns is therefore mapped to itself.  The assignments are
% \global so that they survive any group this file is read in.
% One assignment per line: the space/end of line terminates the number.

% Devanagari
\global\lccode"0901="0901
\global\lccode"0902="0902
\global\lccode"0903="0903
\global\lccode"093E="093E
\global\lccode"093F="093F
\global\lccode"0940="0940
\global\lccode"0941="0941
\global\lccode"0942="0942
\global\lccode"0943="0943
\global\lccode"0944="0944
\global\lccode"0945="0945
\global\lccode"0946="0946
\global\lccode"0947="0947
\global\lccode"0948="0948
\global\lccode"094B="094B
\global\lccode"094C="094C
\global\lccode"094D="094D
\global\lccode"0951="0951
\global\lccode"0952="0952
\global\lccode"0962="0962
\global\lccode"0963="0963

% Bengali
\global\lccode"0981="0981
\global\lccode"0982="0982
\global\lccode"0983="0983
\global\lccode"09BC="09BC
\global\lccode"09BE="09BE
\global\lccode"09BF="09BF
\global\lccode"09C0="09C0
\global\lccode"09C1="09C1
\global\lccode"09C2="09C2
\global\lccode"09C3="09C3
\global\lccode"09C4="09C4
\global\lccode"09C7="09C7
\global\lccode"09C8="09C8
\global\lccode"09CB="09CB
\global\lccode"09CC="09CC
\global\lccode"09CD="09CD
\global\lccode"09D7="09D7
\global\lccode"09E2="09E2
\global\lccode"09E3="09E3

% Telugu
\global\lccode"0C01="0C01
\global\lccode"0C02="0C02
\global\lccode"0C03="0C03
\global\lccode"0C3E="0C3E
\global\lccode"0C3F="0C3F
\global\lccode"0C40="0C40
\global\lccode"0C41="0C41
\global\lccode"0C42="0C42
\global\lccode"0C43="0C43
\global\lccode"0C44="0C44
\global\lccode"0C46="0C46
\global\lccode"0C47="0C47
\global\lccode"0C48="0C48
\global\lccode"0C4A="0C4A
\global\lccode"0C4B="0C4B
\global\lccode"0C4C="0C4C
\global\lccode"0C4D="0C4D
\global\lccode"0C55="0C55
\global\lccode"0C56="0C56

% Kannada
\global\lccode"0C82="0C82
\global\lccode"0C83="0C83
\global\lccode"0CBD="0CBD
\global\lccode"0CBE="0CBE
\global\lccode"0CBF="0CBF
\global\lccode"0CC0="0CC0
\global\lccode"0CC1="0CC1
\global\lccode"0CC2="0CC2
\global\lccode"0CC3="0CC3
\global\lccode"0CC4="0CC4
\global\lccode"0CC6="0CC6
\global\lccode"0CC7="0CC7
\global\lccode"0CC8="0CC8
\global\lccode"0CCA="0CCA
\global\lccode"0CCB="0CCB
\global\lccode"0CCC="0CCC
\global\lccode"0CCD="0CCD
\global\lccode"0CD5="0CD5
\global\lccode"0CD6="0CD6

% Malayalam
\global\lccode"0D02="0D02
\global\lccode"0D03="0D03
\global\lccode"0D3E="0D3E
\global\lccode"0D3F="0D3F
\global\lccode"0D40="0D40
\global\lccode"0D41="0D41
\global\lccode"0D42="0D42
\global\lccode"0D43="0D43
\global\lccode"0D46="0D46
\global\lccode"0D47="0D47
\global\lccode"0D48="0D48
\global\lccode"0D4A="0D4A
\global\lccode"0D4B="0D4B
\global\lccode"0D4C="0D4C
\global\lccode"0D4D="0D4D
\global\lccode"0D57="0D57

% ZWNJ and ZWJ
\global\lccode"200C="200C
\global\lccode"200D="200D

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Allocate a \language code

\newlanguage\sanskrit

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Patterns.
%
% This file must be read as UTF-8.  In a pattern an odd digit allows a
% break at that position, an even digit forbids it, and the higher
% digit wins; `.' marks a word boundary.
%
% The group keeps the \language switch local; the patterns themselves
% are stored for \sanskrit.

\begingroup
\language\sanskrit
\patterns{

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% GENERAL RULE
% Do not break either side of ZERO-WIDTH JOINER  (U+200D)
% and ZERO-WIDTH NON-JOINER (U+200C).
% Both are written in ^^^^xxxx notation (lowercase hex is required):
% the characters are invisible and are easily lost when the file is
% edited or re-encoded.
2^^^^200d2
2^^^^200c2

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% DEVANAGARI SCRIPT

% Break before or after any independent vowel.
1अ1 1आ1 1इ1 1ई1 1उ1 1ऊ1 1ऋ1 1ॠ1 1ऌ1 1ॡ1 1ए1 1ऐ1 1ओ1 1औ1

% Break after any dependent vowel but not before.
2ा1 2ि1 2ी1 2ु1 2ू1 2ृ1 2ॄ1 2ॢ1 2ॣ1 2े1 2ै1 2ो1 2ौ1

% Break before or after any consonant.
1क1 1ख1 1ग1 1घ1 1ङ1 1च1 1छ1 1ज1 1झ1 1ञ1 1ट1 1ठ1 1ड1 1ढ1 1ण1 1त1 1थ1 1द1 1ध1 1न1 1प1 1फ1 1ब1 1भ1 1म1 1य1 1र1 1ल1 1ळ1 1व1 1श1 1ष1 1स1 1ह1

% Do not break before a final consonant or conjunct.
2क्. 2ख्. 2ग्. 2घ्. 2ङ्. 2च्. 2छ्. 2ज्. 2झ्. 2ञ्. 2ट्. 2ठ्. 2ड्. 2ढ्. 2ण्. 2त्. 2थ्. 2द्. 2ध्. 2न्. 2प्. 2फ्. 2ब्. 2भ्. 2म्. 2य्. 2र्. 2ल्. 2ळ्. 2व्. 2श्. 2ष्. 2स्. 2ह्.
2र्क्. 2र्ट्. 2र्त्. 2र्प्.

% Do not break before chandrabindu, anusvara, visarga, avagraha
% and accents.
2ँ 2ं 2ः 2ऽ 2॑ 2॒

% Do not break either side of virama (may be within conjunct).
2्2

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% BENGALI SCRIPT

% Break before or after any independent vowel.
1অ1 1আ1 1ই1 1ঈ1 1উ1 1ঊ1 1ঋ1 1ৠ1 1ঌ1 1ৡ1 1এ1 1ঐ1 1ও1 1ঔ1

% Break after any dependent vowel, but not before.
2া1 2ি1 2ী1 2ু1 2ূ1 2ৃ1 2ৄ1 2ৢ1 2ৣ1 2ে1 2ৈ1 2ো1 2ৌ1

% Break before or after any consonant.
% RRA (U+09DC), RHA (U+09DD) and YYA (U+09DF) are given in ^^^^xxxx
% notation so that the precomposed code points are not silently
% decomposed into base letter + nukta by Unicode normalization.
1ক1 1খ1 1গ1 1ঘ1 1ঙ1 1চ1 1ছ1 1জ1 1ঝ1 1ঞ1 1ট1 1ঠ1 1ড1 1^^^^09dc1 1ঢ1 1^^^^09dd1 1ণ1 1ত1 1থ1 1দ1 1ধ1 1ন1 1প1 1ফ1 1ব1 1ভ1 1ম1 1য1 1^^^^09df1 1র1 1ল1 1শ1 1ষ1 1স1 1হ1

% Do not break after khanda ta.
1ৎ2

% Do not break before a final consonant or conjunct.
% (^^^^09cd is the Bengali virama.)
2ক্. 2খ্. 2গ্. 2ঘ্. 2ঙ্. 2চ্. 2ছ্. 2জ্. 2ঝ্. 2ঞ্. 2ট্. 2ঠ্. 2ড্. 2^^^^09dc^^^^09cd. 2ঢ্. 2^^^^09dd^^^^09cd. 2ণ্. 2ত্. 2থ্. 2দ্. 2ধ্. 2ন্. 2প্. 2ফ্. 2ব্. 2ভ্. 2ম্. 2য্. 2^^^^09df^^^^09cd. 2র্. 2ল্. 2শ্. 2ষ্. 2স্. 2হ্.
% Final conjuncts end in a virama, exactly as in the Devanagari and
% Telugu rules; without it the rule would match words ending in
% -rka, -rta, ... and miss real final conjuncts.
2র্ক্. 2র্ট্. 2র্ত্. 2র্প্.

% Do not break before chandrabindu, anusvara, visarga, avagraha,
% nukta and au length mark.
2ঁ 2ং 2ঃ 2ঽ 2় 2ৗ

% Do not break either side of virama (may be within conjunct).
2্2

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% KANNADA SCRIPT

% Break before or after any independent vowel.
1ಅ1 1ಆ1 1ಇ1 1ಈ1 1ಉ1 1ಊ1 1ಋ1 1ೠ1 1ಌ1 1ೡ1 1ಎ1 1ಏ1 1ಐ1 1ಒ1 1ಓ1 1ಔ1

% Break after any dependent vowel, but not before.
2ಾ1 2ಿ1 2ೀ1 2ು1 2ೂ1 2ೃ1 2ೄ1 2ೆ1 2ೇ1 2ೈ1 2ೊ1 2ೋ1 2ೌ1

% Break before or after any consonant.
1ಕ1 1ಖ1 1ಗ1 1ಘ1 1ಙ1 1ಚ1 1ಛ1 1ಜ1 1ಝ1 1ಞ1 1ಟ1 1ಠ1 1ಡ1 1ಢ1 1ಣ1 1ತ1 1ಥ1 1ದ1 1ಧ1 1ನ1 1ಪ1 1ಫ1 1ಬ1 1ಭ1 1ಮ1 1ಯ1 1ರ1 1ಱ1 % can occur in Sanskrit?
1ಲ1 1ಳ1 1ೞ1 % can occur in Sanskrit?
1ವ1 1ಶ1 1ಷ1 1ಸ1 1ಹ1

% Do not break before a final consonant or conjunct.
% NOTE(review): LLLA (U+0CDE) is listed among the consonants above but
% has no final-consonant pattern here -- confirm that this is intended.
2ಕ್. 2ಖ್. 2ಗ್. 2ಘ್. 2ಙ್. 2ಚ್. 2ಛ್. 2ಜ್. 2ಝ್. 2ಞ್. 2ಟ್. 2ಠ್. 2ಡ್. 2ಢ್. 2ಣ್. 2ತ್. 2ಥ್. 2ದ್. 2ಧ್. 2ನ್. 2ಪ್. 2ಫ್. 2ಬ್. 2ಭ್. 2ಮ್. 2ಯ್. 2ರ್. 2ಱ್. % can occur in Sanskrit?
2ಲ್. 2ಳ್. 2ವ್. 2ಶ್. 2ಷ್. 2ಸ್. 2ಹ್.
% Final conjuncts end in a virama, exactly as in the Devanagari and
% Telugu rules.
2ರ್ಕ್. 2ರ್ಟ್. 2ರ್ತ್. 2ರ್ಪ್.

% Do not break before anusvara, visarga, avagraha,
% length mark and ai length mark.
2ಂ 2ಃ 2ಽ 2ೕ 2ೖ

% Do not break either side of virama (may be within conjunct).
2್2

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% MALAYALAM SCRIPT

% Break before or after any independent vowel.
1അ1 1ആ1 1ഇ1 1ഈ1 1ഉ1 1ഊ1 1ഋ1 1ൠ1 1ഌ1 1ൡ1 1എ1 1ഏ1 1ഐ1 1ഒ1 1ഓ1 1ഔ1

% Break after any dependent vowel, but not before.
2ാ1 2ി1 2ീ1 2ു1 2ൂ1 2ൃ1 2െ1 2േ1 2ൈ1 2ൊ1 2ോ1 2ൌ1

% Break before or after any consonant.
1ക1 1ഖ1 1ഗ1 1ഘ1 1ങ1 1ച1 1ഛ1 1ജ1 1ഝ1 1ഞ1 1ട1 1ഠ1 1ഡ1 1ഢ1 1ണ1 1ത1 1ഥ1 1ദ1 1ധ1 1ന1 1പ1 1ഫ1 1ബ1 1ഭ1 1മ1 1യ1 1ര1 1റ1 % can occur in Sanskrit?
1ല1 1ള1 1ഴ1 % can occur in Sanskrit?
1വ1 1ശ1 1ഷ1 1സ1 1ഹ1

% Do not break before a final consonant or conjunct.
2ക്. 2ഖ്. 2ഗ്. 2ഘ്. 2ങ്. 2ച്. 2ഛ്. 2ജ്. 2ഝ്. 2ഞ്. 2ട്. 2ഠ്. 2ഡ്. 2ഢ്. 2ണ്. 2ത്. 2ഥ്. 2ദ്. 2ധ്. 2ന്. 2പ്. 2ഫ്. 2ബ്. 2ഭ്. 2മ്. 2യ്. 2ര്. 2റ്. % can occur in Sanskrit?
2ല്. 2ള്. 2ഴ്. % can occur in Sanskrit?
2വ്. 2ശ്. 2ഷ്. 2സ്. 2ഹ്.
% Final conjuncts end in a virama, exactly as in the Devanagari and
% Telugu rules.
2ര്ക്. 2ര്ട്. 2ര്ത്. 2ര്പ്.

% Do not break before anusvara, visarga and length mark.
2ം 2ഃ 2ൗ

% Do not break either side of virama (may be within conjunct).
2്2

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% TELUGU SCRIPT

% Break before or after any independent vowel.
1అ1 1ఆ1 1ఇ1 1ఈ1 1ఉ1 1ఊ1 1ఋ1 1ౠ1 1ఌ1 1ౡ1 1ఎ1 1ఏ1 1ఐ1 1ఒ1 1ఓ1 1ఔ1

% Break after any dependent vowel, but not before.
2ా1 2ి1 2ీ1 2ు1 2ూ1 2ృ1 2ౄ1 2ె1 2ే1 2ై1 2ొ1 2ో1 2ౌ1

% Break before or after any consonant.
1క1 1ఖ1 1గ1 1ఘ1 1ఙ1 1చ1 1ఛ1 1జ1 1ఝ1 1ఞ1 1ట1 1ఠ1 1డ1 1ఢ1 1ణ1 1త1 1థ1 1ద1 1ధ1 1న1 1ప1 1ఫ1 1బ1 1భ1 1మ1 1య1 1ర1 1ఱ1 % can occur in Sanskrit?
1ల1 1ళ1 1వ1 1శ1 1ష1 1స1 1హ1

% Do not break before a final consonant or conjunct.
2క్. 2ఖ్. 2గ్. 2ఘ్. 2ఙ్. 2చ్. 2ఛ్. 2జ్. 2ఝ్. 2ఞ్. 2ట్. 2ఠ్. 2డ్. 2ఢ్. 2ణ్. 2త్. 2థ్. 2ద్. 2ధ్. 2న్. 2ప్. 2ఫ్. 2బ్. 2భ్. 2మ్. 2య్. 2ర్. 2ఱ్. % can occur in Sanskrit?
2ల్. 2ళ్. 2వ్. 2శ్. 2ష్. 2స్. 2హ్.
2ర్క్. 2ర్ట్. 2ర్త్. 2ర్ప్.

% Do not break before chandrabindu, anusvara, visarga,
% length mark and ai length mark.
2ఁ 2ం 2ః 2ౕ 2ౖ

% Do not break either side of virama (may be within conjunct).
2్2
}
\endgroup