-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtransliterators-sample.json
22 lines (22 loc) · 26.1 KB
/
transliterators-sample.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
[
{
"name": "Balinese-InterIndic",
"rules": "::NFC;\n\nᬒᬁ → \\uE050; # OM\n#ᬀ → \\uE001; # SIGN ULU RICEM\nᬁ → \\uE001; # SIGN ULU CANDRA\nᬂ → \\uE002; # SIGN CECEK\n#ᬃ → \\uE030\\uE04D; # SIGN SURANG\nᬄ → \\uE003; # SIGN BISAH\nᬅ → \\uE005; # LETTER AKARA\nᬆ → \\uE006; # LETTER AKARA TEDUNG\nᬇ → \\uE007; # LETTER IKARA\nᬈ → \\uE008; # LETTER IKARA TEDUNG\nᬉ → \\uE009; # LETTER UKARA\nᬊ → \\uE00A; # LETTER UKARA TEDUNG\nᬋ → \\uE00B; # LETTER RA REPA\nᬌ → \\uE060; # LETTER RA REPA TEDUNG\nᬍ → \\uE00C; # LETTER LA LENGA\nᬎ → \\uE061; # LETTER LA LENGA TEDUNG\nᬏ → \\uE00F; # LETTER EKARA\nᬐ → \\uE010; # LETTER AIKARA\nᬑ → \\uE013; # LETTER OKARA\nᬒ → \\uE014; # LETTER OKARA TEDUNG\nᬓ → \\uE015; # LETTER KA\nᬔ → \\uE016; # LETTER KA MAHAPRANA\nᬕ → \\uE017; # LETTER GA\nᬖ → \\uE018; # LETTER GA GORA\nᬗ → \\uE019; # LETTER NGA\nᬘ → \\uE01A; # LETTER CA\nᬙ → \\uE01B; # LETTER CA LACA\nᬚ → \\uE01C; # LETTER JA\nᬛ → \\uE01D; # LETTER JA JERA\nᬜ → \\uE01E; # LETTER NYA\nᬝ → \\uE01F; # LETTER TA LATIK\nᬞ → \\uE020; # LETTER TA MURDA MAHAPRANA\nᬟ → \\uE021; # LETTER DA MURDA ALPAPRANA\nᬠ → \\uE022; # LETTER DA MURDA MAHAPRANA\nᬡ → \\uE023; # LETTER NA RAMBAT\nᬢ → \\uE024; # LETTER TA\nᬣ → \\uE025; # LETTER TA TAWA\nᬤ → \\uE026; # LETTER DA\nᬥ → \\uE027; # LETTER DA MADU\nᬦ → \\uE028; # LETTER NA\nᬧ → \\uE02A; # LETTER PA\nᬨ → \\uE02B; # LETTER PA KAPAL\nᬩ → \\uE02C; # LETTER BA\nᬪ → \\uE02D; # LETTER BA KEMBANG\nᬫ → \\uE02E; # LETTER MA\nᬬ → \\uE02F; # LETTER YA\nᬭ → \\uE030; # LETTER RA\nᬮ → \\uE032; # LETTER LA\nᬯ → \\uE035; # LETTER WA\nᬰ → \\uE036; # LETTER SA SAGA\nᬱ → \\uE037; # LETTER SA SAPA\nᬲ → \\uE038; # LETTER SA\nᬳ → \\uE039; # LETTER HA\n᬴ → \\uE03C; # SIGN REREKAN\nᬵ → \\uE03E; # VOWEL SIGN TEDUNG\nᬶ → \\uE03F; # VOWEL SIGN ULU\nᬷ → \\uE040; # VOWEL SIGN ULU SARI\nᬸ → \\uE041; # VOWEL SIGN SUKU\nᬹ → \\uE042; # VOWEL SIGN SUKU ILUT\nᬺ → \\uE043; # VOWEL SIGN RA REPA\nᬻ → \\uE044; # VOWEL SIGN RA REPA TEDUNG\nᬼ→ \\uE062; # VOWEL SIGN LA LENGA\nᬽ → \\uE063; # VOWEL SIGN LA LENGA TEDUNG\nᬾ → \\uE047; 
# VOWEL SIGN TALING\nᬿ → \\uE048; # VOWEL SIGN TALING REPA\nᭀ → \\uE04B; # VOWEL SIGN TALING TEDUNG\nᭁ → \\uE04C; # VOWEL SIGN TALING REPA TEDUNG\nᭂ → \\uE045; # VOWEL SIGN PEPET\nᭃ → \\uE049; # VOWEL SIGN PEPET TEDUNG\n᭄ → \\uE04D; # ADEG ADEG\nᭅ → \\uE058; # LETTER KAF SASAK\nᭆ → \\uE059; # LETTER KHOT SASAK\nᭇ → \\uE024\\uE03C; # LETTER TZIR SASAK\nᭈ → \\uE05E; # LETTER EF SASAK\nᭉ → \\uE081; # LETTER VE SASAK\nᭊ → \\uE05B; # LETTER ZAL SASAK\nᭋ → \\uE038\\uE03C; # LETTER ASYURA SASAK\n᭐ → \\uE066; # DIGIT ZERO\n᭑ → \\uE067; # DIGIT ONE\n᭒ → \\uE068; # DIGIT TWO\n᭓ → \\uE069; # DIGIT THREE\n᭔ → \\uE06A; # DIGIT FOUR\n᭕ → \\uE06B; # DIGIT FIVE\n᭖ → \\uE06C; # DIGIT SIX\n᭗ → \\uE06D; # DIGIT SEVEN\n᭘ → \\uE06E; # DIGIT EIGHT\n᭙ → \\uE06F; # DIGIT NINE\n᭚ → ' // '; # PANTI\n᭛ → ' /// '; # PAMADA\n᭜ → •; # WINDU\n᭟᭜᭟ → ' \\\\•\\\\ ';\n᭟ ' ' ᭜ ' ' ᭟ → ' \\\\ • \\\\ ';\n᭝ → \\:; # CARIK PAMUNGKAH\n᭞ → \\uE064; # CARIK SIKI\n᭟ → \\uE065; # CARIK PAREREN\n᭠ → ‐; # PAMENENG\n"
},
{
"name": "InterIndic-ban_000",
"rules": "#\\u0E00 reserved\n#consonants\n$chandrabindu=\\uE001;\n$ardhachandra=\\u1B00;\n$anusvara=\\uE002;\n$visarga=\\uE003;\n#\\u0E004 reserved\n# w←vowel→ represents the stand-alone form\n$wa=\\uE005;\n$waa=\\uE006;\n$wi=\\uE007;\n$wii=\\uE008;\n$wu=\\uE009;\n$wuu=\\uE00A;\n$wr=\\uE00B;\n$wl=\\uE00C;\n$wce=\\uE00D; # LETTER CANDRA E\n$wse=\\uE00E; # LETTER SHORT E\n$we=\\uE00F; # ए LETTER E\n$wai=\\uE010;\n$wco=\\uE011; # LETTER CANDRA O\n$wso=\\uE012; # LETTER SHORT O\n$wo=\\uE013; # ओ LETTER O\n$wau=\\uE014;\n$ka=\\uE015;\n$kha=\\uE016;\n$ga=\\uE017;\n$gha=\\uE018;\n$nga=\\uE019;\n$ca=\\uE01A;\n$cha=\\uE01B;\n$ja=\\uE01C;\n$jha=\\uE01D;\n$nya=\\uE01E;\n$tta=\\uE01F;\n$ttha=\\uE020;\n$dda=\\uE021;\n$ddha=\\uE022;\n$nna=\\uE023;\n$ta=\\uE024;\n$tha=\\uE025;\n$da=\\uE026;\n$dha=\\uE027;\n$na=\\uE028;\n$ena=\\uE029; #compatibility\n$pa=\\uE02A;\n$pha=\\uE02B;\n$ba=\\uE02C;\n$bha=\\uE02D;\n$ma=\\uE02E;\n$ya=\\uE02F;\n$ra=\\uE030;\n$vva=\\uE081;\n$rra=\\uE031;\n$la=\\uE032;\n$lla=\\uE033;\n$ela=\\uE034; #compatibility\n$va=\\uE035;\n$sha=\\uE036;\n$ssa=\\uE037;\n$sa=\\uE038;\n$ha=\\uE039;\n#\\u093A Reserved\n#\\u093B Reserved\n$nukta=\\uE03C;\n$avagraha=\\uE03D; # SIGN AVAGRAHA\n# ←vowel→ represents the dependent form\n$aa=\\uE03E;\n$i=\\uE03F;\n$ii=\\uE040;\n$u=\\uE041;\n$uu=\\uE042;\n$rh=\\uE043;\n$rrh=\\uE044;\n$ce=\\uE045; #VOWEL SIGN CANDRA E\n$se=\\uE046; #VOWEL SIGN SHORT E\n$e=\\uE047;\n$ai=\\uE048;\n$co=\\uE049; # VOWEL SIGN CANDRA O\n$so=\\uE04A; # VOWEL SIGN SHORT O\n$o=\\uE04B; # ो\n$au=\\uE04C;\n$virama=\\uE04D;\n# \\u094E Reserved\n# \\u094F Reserved\n$om=\\uE050; # OM\n\\uE051→; # UNMAPPED STRESS SIGN UDATTA\n\\uE052→; # UNMAPPED STRESS SIGN ANUDATTA\n\\uE053→; # UNMAPPED GRAVE ACCENT\n\\uE054→; # UNMAPPED ACUTE ACCENT\n$lm = \\uE055;# Telugu Length Mark\n$ailm=\\uE056;# AI Length Mark\n$aulm=\\uE057;# AU Length Mark\n#urdu compatibity 
forms\n$uka=\\uE058;\n$ukha=\\uE059;\n$ugha=\\uE05A;\n$ujha=\\uE05B;\n$uddha=\\uE05C;\n$udha=\\uE05D;\n$ufa=\\uE05E;\n$uya=\\uE05F;\n$wrr=\\uE060;\n$wll=\\uE061;\n$lh=\\uE062;\n$llh=\\uE063;\n$danda=\\uE064;\n$doubleDanda=\\uE065;\n$zero=\\uE066; # DIGIT ZERO\n$one=\\uE067; # DIGIT ONE\n$two=\\uE068; # DIGIT TWO\n$three=\\uE069; # DIGIT THREE\n$four=\\uE06A; # DIGIT FOUR\n$five=\\uE06B; # DIGIT FIVE\n$six=\\uE06C; # DIGIT SIX\n$seven=\\uE06D; # DIGIT SEVEN\n$eight=\\uE06E; # DIGIT EIGHT\n$nine=\\uE06F; # DIGIT NINE\n# Glottal stop\n$dgs=\\uE082;\n#Khanda-ta\n$kta=\\uE083;\n$depVowelAbove=[\\uE03E-\\uE040\\uE045-\\uE04C];\n$depVowelBelow=[\\uE041-\\uE044];\n# $x was originally called '§'; $z was '%'\n$x=[$aa$ai$au$ii$i$uu$u$rrh$rh$lh$llh$e$o$se$ce$so$co];\n$z=[bcdfghjklmnpqrstvwxyz];\n$vowels=[aeiour̥̄̆];\n$forceIndependentMatra = [^[[:L:][̀-͌]]];\n######################################################################\n# convert from Native letters to Latin letters\n######################################################################\n\n#anusvara\n$anusvara} [$ka$kha$ga$gha$nga] → ng;\n$anusvara} [$ca$cha$ja$jha$nya] → n;\n$anusvara} [$tta$ttha$dda$ddha$nna] → n;\n$anusvara} [$ta$tha$da$dha$na] → n;\n$anusvara} [$pa$pha$ba$bha$ma] → m;\n$anusvara} [$ya$ra$lla$la$va$ssa$sha$sa$ha] → n;\n$anusvara→ ng;\n\n#surang\nᬃ → r;\n\n# Urdu compatibility\n$ya$nukta}$x → y;\n$ya$nukta$virama → y;\n$ya$nukta → ya;\n$la$nukta }$x → l;\n$la$nukta$virama → l;\n$la$nukta → la;\n$na$nukta }$x → n;\n$na$nukta$virama → n;\n$na$nukta → na;\n$ena }$x → n;\n$ena$virama → n;\n$ena → na;\n$uka → qa;\n$ka$nukta }$x → q;\n$ka$nukta$virama → q;\n$ka$nukta → qa;\n$kha$nukta }$x → kh;\n$kha$nukta$virama → kh;\n$kha$nukta → kha;\n$ukha$virama → kh;\n$ukha → kha;\n$ugha → gha;\n$ga$nukta }$x → gh;\n$ga$nukta$virama → gh;\n$ga$nukta → gha;\n$ujha → za;\n$ja$nukta }$x → z;\n$ja$nukta$virama → z;\n$ja$nukta → za;\n$ddha$nukta}$x → r;\n$ddha$nukta$virama → r;\n$ddha$nukta → ra;\n$uddha}$x → 
r;\n$uddha$virama → r;\n$uddha → ra;\n$udha → ra;\n$dda$nukta}$x → r;\n$dda$nukta$virama → r;\n$dda$nukta → ra;\n$pha$nukta }$x → f;\n$pha$nukta$virama → f;\n$pha$nukta → fa;\n$ufa }$x → f;\n$ufa$virama → f;\n$ufa → fa;\n$ra$nukta}$x → r;\n$ra$nukta$virama → r;\n$ra$nukta → ra;\n$lla$nukta}$x → l;\n$lla$nukta$virama → l;\n$lla$nukta → la;\n$ela}$x → l;\n$ela$virama → l;\n$ela → la;\n$uya}$x → y;\n$uya$virama → y;\n$uya → ya;\n\n# normal consonants\n#$ka$virama}$ha→k'';\n$ka}$x→k;\n$ka$virama→k;\n$ka→ka;\n$kha}$x→k;\n$kha$virama→k;\n$kha→ka;\n#$ga$virama}$ha→g'';\n$ga}$x→g;\n$ga$virama→g;\n$ga→ga;\n$gha}$x→g;\n$gha$virama→g;\n$gha→ga;\n$nga}$x→ng;\n$nga$virama→ng;\n$nga→nga;\n#$ca$virama}$ha→c'';\n$ca}$x→c;\n$ca$virama→c;\n$ca→ca;\n$cha}$x→c;\n$cha$virama→c;\n$cha→ca;\n#$ja$virama}$ha→j'';\n$ja}$x→j;\n$ja$virama→j;\n$ja→ja;\n$jha}$x→j;\n$jha$virama→j;\n$jha→ja;\n$nya }$x→ny;\n$nya$virama }[$ca$cha$ja$jha$nya]→n;\n$nya$virama→ny;\n$nya → nya;\n#$tta$virama}$ha→t'';\n$tta}$x→t;\n$tta$virama→t;\n$tta→ta;\n$ttha}$x→t;\n$ttha$virama→t;\n$ttha→ta;\n#$dda}$x$ha→d'';\n$dda}$x→d;\n$dda$virama→d;\n$dda→da;\n$ddha}$x→d;\n$ddha$virama→d;\n$ddha→da;\n$nna}$x→n;\n$nna$virama→n;\n$nna→na;\n#$ta$virama}$ha→t'';\n#$ta$virama}$ttha→t'';\n#$ta$virama}$tta→t'';\n#$ta$virama}$tha→t'';\n$ta}$x→t;\n$ta$virama→t;\n$ta→ta;\n$tha}$x→t;\n$tha$virama→t;\n$tha→ta;\n#$da$virama}$ha→d'';\n#$da$virama}$ddha→d'';\n#$da$virama}$dda→d'';\n#$da$virama}$dha→d'';\n$da}$x→d;\n$da$virama→d;\n$da→da;\n$dha}$x→d;\n$dha$virama→d;\n$dha→da;\n$na$virama}$ga→n'';\n$na$virama}$ya→n'';\n$na}$x→n;\n$na$virama→n;\n$na→na;\n#$pa$virama}$ha→p'';\n$pa}$x→p;\n$pa$virama→p;\n$pa→pa;\n$pha}$x→p;\n$pha$virama→p;\n$pha→pa;\n#$ba$virama}$ha→b'';\n$ba}$x→b;\n$ba$virama→b;\n$ba→ba;\n$bha}$x→b;\n$bha$virama→b;\n$bha→ba;\n#$ma$virama}$ma→m'';\n$ma}$x→m;\n$ma$virama→m;\n$ma→ma;\n$ya}$x→y;\n$ya$virama→y;\n$ya→ya;\n#$ra$virama}$ha→r'';\n$ra}$x→r;\n$ra$virama→r;\n$ra→ra;\n#$vva$virama}$ha→ẇ'';\n$vva}$x→w;\n$vva$virama→w;\n$vva→wa;\n
#$rra$virama}$ha→ṟ'';\n$rra}$x→r;\n$rra$virama→r;\n$rra→ra;\n#$la$virama}$ha→l'';\n$la}$x→l;\n$la$virama→l;\n$la→la;\n#$lla$virama}$ha→ḷ'';\n$lla}$x→l;\n$lla$virama→l;\n$lla→la;\n$va}$x→w;\n$va$virama→w;\n$va→wa;\n#$sa$virama}$ha→s'';\n#$sa$virama}$sha→s'';\n#$sa$virama}$ssa→s'';\n#$sa$virama}$sa→s'';\n$sa}$x→s;\n$sa$virama→s;\n\n#for gurmukhi\n$sa$nukta}$x→sy;\n$sa$nukta$virama→sy;\n$sa$nukta→sya;\n$sa→sa;\n$sha}$x→sy;\n$sha$virama→sy;\n$sha→sya;\n$ssa}$x→sy;\n$ssa$virama→sy;\n$ssa→sya;\n$ha}$x→h;\n$ha$virama→h;\n$ha→ha;\n\n# dependent vowels (should never occur except following consonants)\n$forceIndependentMatra{$aa → ̔ā;\n$forceIndependentMatra{$ai → ̔ai;\n$forceIndependentMatra{$au → ̔au;\n$forceIndependentMatra{$ii → ̔ī;\n$forceIndependentMatra{$i → ̔i;\n$forceIndependentMatra{$uu → ̔ū;\n$forceIndependentMatra{$u → ̔u;\n$forceIndependentMatra{$rrh → ̔rē;\n$forceIndependentMatra{$rh → ̔re;\n$forceIndependentMatra{$llh → ̔lē;\n$forceIndependentMatra{$lh → ̔le;\n$forceIndependentMatra{$e → ̔é;\n$forceIndependentMatra{$o → ̔o;\n#extra vowels\n$forceIndependentMatra{$ce → ̔e;\n$forceIndependentMatra{$co → ̔ē;\n$forceIndependentMatra{$se → ̔e;\n$forceIndependentMatra{$so → ̔o;\n$forceIndependentMatra{$nukta →; # Nukta cannot appear independently or as first character\n$forceIndependentMatra{$virama →; # Virama cannot appear independently or as first character\n$aa → ā;\n$ai → ai;\n$au → au;\n$ii → ī;\n$i → i;\n$uu → ū;\n$u → u;\n$rrh → rē;\n$rh → re;\n$llh → lē;\n$lh → le;\n$e → é;\n$o → o;\n#extra vowels\n$ce → e;\n$co → ē;\n$se → e;\n$so → o;\n\n#dependent vowels when following independent vowels. 
Generally Illegal only for roundtripping\n$waa} $x → ā;\n$wai} $x → ai;\n$wau} $x → au;\n$wii} $x → ī;\n$wi } $x → i;\n$wuu} $x → ū;\n$wu } $x → u;\n$wrr} $x → rē;\n$wr } $x → re;\n$wll} $x → lē;\n$wl } $x → le;\n$we } $x → é;\n$wo } $x → o;\n$wa } $x → a;\n#extra vowels\n$wce} $x → e;\n$wco} $x → ē;\n$wse} $x → e;\n$wso} $x → o;\n$om} $x → om;\n\n# independent vowels when preceded by vowels\n$vowels{$waa → ''ā;\n$vowels{$wai → ''ai;\n$vowels{$wau → ''au;\n$vowels{$wii → ''ī;\n$vowels{$wi → ''i;\n$vowels{$wuu → ''ū;\n$vowels{$wu → ''u;\n$vowels{$wrr → ''rē;\n$vowels{$wr → ''re;\n$vowels{$wll → ''lē;\n$vowels{$wl → ''le;\n$vowels{$we → ''é;\n$vowels{$wo → ''o;\n$vowels{$wa → ''a;\n#extra vowels\n$vowels{$wce → ''e;\n$vowels{$wco → ''ē;\n$vowels{$wse → ''e;\n$vowels{$wso → ''o;\n$vowels{$om → ''om;\n\n# independent vowels (otherwise)\n$waa → ā;\n$wai → ai;\n$wau → au;\n$wii → ī;\n$wi → i;\n$wuu → ū;\n$wu → u;\n$wrr → rē;\n$wr → re;\n$wll → lē;\n$wl → le;\n$we → é;\n$wo → o;\n$wa → a;\n#extra vowels\n$wce → e;\n$wco → ē;\n$wse → e;\n$wso → o;\n$om → om;\n\n#stress marks\n$avagraha → ;\n$chandrabindu → ng;\n$ardhachandra → m;\n$visarga → h;\n\n#numbers\n$zero → 0;\n$one → 1;\n$two → 2;\n$three → 3;\n$four → 4;\n$five → 5;\n$six → 6;\n$seven → 7;\n$eight → 8;\n$nine → 9;\n$lm →;\n$ailm →;\n$aulm →;\n$dgs→'';\n$kta→t;\n# Balinese numbers are surrounded by dandas which can be removed\n$danda } [$zero$one$two$three$four$five$six$seven$eight$nine] →;\n[0123456789] { $danda →;\n$danda→',';\n$doubleDanda→'.';\n\n\\uE070→; # ABBREVIATION SIGN\n# LETTER RA WITH MIDDLE DIAGONAL\n\\uE071}$x→ra;\n\\uE071$virama→r;\n\\uE071→ra;\n# LETTER RA WITH LOWER DIAGONAL\n\\uE072}$x→ra;\n\\uE072$virama→r;\n\\uE072→ra;\n\\uE073→; # RUPEE MARK\n\\uE074→; # RUPEE SIGN\n\\uE075→; # CURRENCY NUMERATOR ONE\n\\uE076→; # CURRENCY NUMERATOR TWO\n\\uE077→; # CURRENCY NUMERATOR THREE\n\\uE078→; # CURRENCY NUMERATOR FOUR\n\\uE079→; # CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR\n\\uE07A→; # CURRENCY 
DENOMINATOR SIXTEEN\n\\uE07B→; # ISSHAR\n\\uE07C→; # TIPPI\n\\uE07D→; # ADDAK\n\\uE07E→; # IRI\n\\uE07F→; # URA\n\\uE080→; # EK ONKAR\n\\uE004→; # DEVANAGARI VOWEL SIGN SHORT A\n\n::NFC;\n"
},
{
"name": "Balinese-ban_000",
"rules": "::Balinese-InterIndic;\n::InterIndic-ban_000;\n"
},
{
"name": "InterIndic-ban_001",
"rules": "#\\u0E00 reserved\n#consonants\n$chandrabindu=\\uE001;\n$ardhachandra=\\u1B00;\n$anusvara=\\uE002;\n$visarga=\\uE003;\n#\\u0E004 reserved\n# w←vowel→ represents the stand-alone form\n$wa=\\uE005;\n$waa=\\uE006;\n$wi=\\uE007;\n$wii=\\uE008;\n$wu=\\uE009;\n$wuu=\\uE00A;\n$wr=\\uE00B;\n$wl=\\uE00C;\n$wce=\\uE00D; # LETTER CANDRA E\n$wse=\\uE00E; # LETTER SHORT E\n$we=\\uE00F; # ए LETTER E\n$wai=\\uE010;\n$wco=\\uE011; # LETTER CANDRA O\n$wso=\\uE012; # LETTER SHORT O\n$wo=\\uE013; # ओ LETTER O\n$wau=\\uE014;\n$ka=\\uE015;\n$kha=\\uE016;\n$ga=\\uE017;\n$gha=\\uE018;\n$nga=\\uE019;\n$ca=\\uE01A;\n$cha=\\uE01B;\n$ja=\\uE01C;\n$jha=\\uE01D;\n$nya=\\uE01E;\n$tta=\\uE01F;\n$ttha=\\uE020;\n$dda=\\uE021;\n$ddha=\\uE022;\n$nna=\\uE023;\n$ta=\\uE024;\n$tha=\\uE025;\n$da=\\uE026;\n$dha=\\uE027;\n$na=\\uE028;\n$ena=\\uE029; #compatibility\n$pa=\\uE02A;\n$pha=\\uE02B;\n$ba=\\uE02C;\n$bha=\\uE02D;\n$ma=\\uE02E;\n$ya=\\uE02F;\n$ra=\\uE030;\n$vva=\\uE081;\n$rra=\\uE031;\n$la=\\uE032;\n$lla=\\uE033;\n$ela=\\uE034; #compatibility\n$va=\\uE035;\n$sha=\\uE036;\n$ssa=\\uE037;\n$sa=\\uE038;\n$ha=\\uE039;\n#\\u093A Reserved\n#\\u093B Reserved\n$nukta=\\uE03C;\n$avagraha=\\uE03D; # SIGN AVAGRAHA\n# ←vowel→ represents the dependent form\n$aa=\\uE03E;\n$i=\\uE03F;\n$ii=\\uE040;\n$u=\\uE041;\n$uu=\\uE042;\n$rh=\\uE043;\n$rrh=\\uE044;\n$ce=\\uE045; #VOWEL SIGN CANDRA E\n$se=\\uE046; #VOWEL SIGN SHORT E\n$e=\\uE047;\n$ai=\\uE048;\n$co=\\uE049; # VOWEL SIGN CANDRA O\n$so=\\uE04A; # VOWEL SIGN SHORT O\n$o=\\uE04B; # ो\n$au=\\uE04C;\n$virama=\\uE04D;\n# \\u094E Reserved\n# \\u094F Reserved\n$om=\\uE050; # OM\n\\uE051→; # UNMAPPED STRESS SIGN UDATTA\n\\uE052→; # UNMAPPED STRESS SIGN ANUDATTA\n\\uE053→; # UNMAPPED GRAVE ACCENT\n\\uE054→; # UNMAPPED ACUTE ACCENT\n$lm = \\uE055;# Telugu Length Mark\n$ailm=\\uE056;# AI Length Mark\n$aulm=\\uE057;# AU Length Mark\n#urdu compatibity 
forms\n$uka=\\uE058;\n$ukha=\\uE059;\n$ugha=\\uE05A;\n$ujha=\\uE05B;\n$uddha=\\uE05C;\n$udha=\\uE05D;\n$ufa=\\uE05E;\n$uya=\\uE05F;\n$wrr=\\uE060;\n$wll=\\uE061;\n$lh=\\uE062;\n$llh=\\uE063;\n$danda=\\uE064;\n$doubleDanda=\\uE065;\n$zero=\\uE066; # DIGIT ZERO\n$one=\\uE067; # DIGIT ONE\n$two=\\uE068; # DIGIT TWO\n$three=\\uE069; # DIGIT THREE\n$four=\\uE06A; # DIGIT FOUR\n$five=\\uE06B; # DIGIT FIVE\n$six=\\uE06C; # DIGIT SIX\n$seven=\\uE06D; # DIGIT SEVEN\n$eight=\\uE06E; # DIGIT EIGHT\n$nine=\\uE06F; # DIGIT NINE\n# Glottal stop\n$dgs=\\uE082;\n#Khanda-ta\n$kta=\\uE083;\n$depVowelAbove=[\\uE03E-\\uE040\\uE045-\\uE04C];\n$depVowelBelow=[\\uE041-\\uE044];\n# $x was originally called '§'; $z was '%'\n$x=[$aa$ai$au$ii$i$uu$u$rrh$rh$lh$llh$e$o$se$ce$so$co];\n$z=[bcdfghjklmnpqrstvwxyz];\n$vowels=[aeiour̥̄̆];\n$forceIndependentMatra = [^[[:L:][̀-͌]]];\n$strike=\\u0336;\n\n######################################################################\n# normalize input\n######################################################################\n\n# delete zwnj\n\\u200C→;\n# reprocess from beginning\n::Null;\n\n######################################################################\n# convert from Native letters to Latin letters\n######################################################################\n\n#glottal stop\n$wa$virama → k'';\n\n#anusvara\n$anusvara → ng;\n\n#surang\nᬃ → r̀;\n\n# Urdu compatibility\n$ya$nukta}$x → y;\n$ya$nukta$virama → y;\n$ya$nukta → ya;\n$la$nukta }$x → l;\n$la$nukta$virama → l;\n$la$nukta → la;\n$na$nukta }$x → n;\n$na$nukta$virama → n;\n$na$nukta → na;\n$ena }$x → n;\n$ena$virama → n;\n$ena → na;\n$uka → qa;\n$ka$nukta }$x → q;\n$ka$nukta$virama → q;\n$ka$nukta → qa;\n$kha$nukta }$x → kh;\n$kha$nukta$virama → kh;\n$kha$nukta → kha;\n$ukha$virama → kh;\n$ukha → kha;\n$ugha → gha;\n$ga$nukta }$x → gh;\n$ga$nukta$virama → gh;\n$ga$nukta → gha;\n$ujha → za;\n$ja$nukta }$x → z;\n$ja$nukta$virama → z;\n$ja$nukta → za;\n$ddha$nukta}$x → r;\n$ddha$nukta$virama → 
r;\n$ddha$nukta → ra;\n$uddha}$x → r;\n$uddha$virama → r;\n$uddha → ra;\n$udha → ra;\n$dda$nukta}$x → r;\n$dda$nukta$virama → r;\n$dda$nukta → ra;\n$pha$nukta }$x → f;\n$pha$nukta$virama → f;\n$pha$nukta → fa;\n$ufa }$x → f;\n$ufa$virama → f;\n$ufa → fa;\n$ra$nukta}$x → r;\n$ra$nukta$virama → r;\n$ra$nukta → ra;\n$lla$nukta}$x → l;\n$lla$nukta$virama → l;\n$lla$nukta → la;\n$ela}$x → l;\n$ela$virama → l;\n$ela → la;\n$uya}$x → y;\n$uya$virama → y;\n$uya → ya;\n\n# normal consonants\n$ka$virama}$ha→k'';\n$ka}$x→k;\n$ka$virama→k;\n$ka→ka;\n$kha$i$u→k $strike h $strike;\n$kha}$x→kh;\n$kha$virama→kh;\n$kha→kha;\n$ga$virama}$ha→g'';\n$ga}$x→g;\n$ga$virama→g;\n$ga→ga;\n$gha$i$u→g $strike h $strike;\n$gha}$x→gh;\n$gha$virama→gh;\n$gha→gha;\n$nga$i$u→n $strike g $strike;\n$nga}$x→ng;\n$nga$virama→ng;\n$nga→nga;\n$ca$virama}$ha→c'';\n$ca}$x→c;\n$ca$virama→c;\n$ca→ca;\n$cha$i$u→c $strike h $strike;\n$cha}$x→ch;\n$cha$virama→ch;\n$cha→cha;\n$ja$virama}$ha→j'';\n$ja}$x→j;\n$ja$virama→j;\n$ja→ja;\n$jha$i$u→j $strike h $strike;\n$jha}$x→jh;\n$jha$virama→jh;\n$jha→jha;\n$nya }$x→ñ;\n#$nya$virama }[$ca$cha$ja$jha$nya]→n;\n$nya$virama→ñ;\n$nya → ña;\n$tta$virama}$ha→ṭ'';\n$tta}$x→ṭ;\n$tta$virama→ṭ;\n$tta→ṭa;\n$ttha$i$u→ṭ $strike h $strike;\n$ttha}$x→ṭh;\n$ttha$virama→ṭh;\n$ttha→ṭha;\n$dda$virama}$ha→ḍ'';\n$dda}$x→ḍ;\n$dda$virama→ḍ;\n$dda→ḍa;\n$ddha$i$u→ḍ $strike h $strike;\n$ddha}$x→ḍh;\n$ddha$virama→ḍh;\n$ddha→ḍha;\n$nna}$x→ṇ;\n$nna$virama→ṇ;\n$nna→ṇa;\n$ta$virama}$ha→t'';\n#$ta$virama}$ttha→t'';\n#$ta$virama}$tta→t'';\n#$ta$virama}$tha→t'';\n$ta}$x→t;\n$ta$virama→t;\n$ta→ta;\n$tha$i$u→t $strike h $strike;\n$tha}$x→th;\n$tha$virama→th;\n$tha→tha;\n$da$virama}$ha→d'';\n#$da$virama}$ddha→d'';\n#$da$virama}$dda→d'';\n#$da$virama}$dha→d'';\n$da}$x→d;\n$da$virama→d;\n$da→da;\n$dha$i$u→d $strike h $strike;\n$dha}$x→dh;\n$dha$virama→dh;\n$dha→dha;\n$na$virama}$ga→n'';\n#$na$virama}$ya→n'';\n$na}$x→n;\n$na$virama→n;\n$na→na;\n$pa$virama}$ha→p'';\n$pa}$x→p;\n$pa$virama→p;\n$pa→pa;\n$pha$i$u→p 
$strike h $strike;\n$pha}$x→ph;\n$pha$virama→ph;\n$pha→pha;\n$ba$virama}$ha→b'';\n$ba}$x→b;\n$ba$virama→b;\n$ba→ba;\n$bha$i$u→b $strike h $strike;\n$bha}$x→bh;\n$bha$virama→bh;\n$bha→bha;\n#$ma$virama}$ma→m'';\n$ma}$x→m;\n$ma$virama→m;\n$ma→ma;\n$ya}$x→y;\n$ya$virama→y;\n$ya→ya;\n#$ra$virama}$ha→r'';\n$ra}$x→r;\n$ra$virama→r;\n$ra→ra;\n#$vva$virama}$ha→ẇ'';\n$vva}$x→v;\n$vva$virama→v;\n$vva→va;\n#$rra$virama}$ha→ṟ'';\n$rra}$x→r;\n$rra$virama→r;\n$rra→ra;\n#$la$virama}$ha→l'';\n$la}$x→l;\n$la$virama→l;\n$la→la;\n#$lla$virama}$ha→ḷ'';\n$lla}$x→l;\n$lla$virama→l;\n$lla→la;\n$va}$x→w;\n$va$virama→w;\n$va→wa;\n#$sa$virama}$ha→s'';\n#$sa$virama}$sha→s'';\n#$sa$virama}$ssa→s'';\n#$sa$virama}$sa→s'';\n$sa}$x→s;\n$sa$virama→s;\n#for gurmukhi\n$sa$nukta}$x→sy;\n$sa$nukta$virama→sy;\n$sa$nukta→sya;\n$sa→sa;\n$sha}$x→ś;\n$sha$virama→ś;\n$sha→śa;\n$ssa}$x→ṣ;\n$ssa$virama→ṣ;\n$ssa→ṣa;\n$ha}$x→h;\n$ha$virama→h;\n$ha→ha;\n\n# dependent vowels (should never occur except following consonants)\n$forceIndependentMatra{$aa → ̔ā;\n$forceIndependentMatra{$ai → ̔ai;\n$forceIndependentMatra{$au → ̔au;\n$forceIndependentMatra{$ii → ̔ī;\n$forceIndependentMatra{$i → ̔i;\n$forceIndependentMatra{$uu → ̔ū;\n$forceIndependentMatra{$u → ̔u;\n$forceIndependentMatra{$rrh → ̔r̥ö;\n$forceIndependentMatra{$rh → ̔r̥ĕ;\n$forceIndependentMatra{$llh → ̔l̥ö;\n$forceIndependentMatra{$lh → ̔l̥ĕ;\n$forceIndependentMatra{$e → ̔e;\n$forceIndependentMatra{$o → ̔o;\n#extra vowels\n$forceIndependentMatra{$ce → ̔ĕ;\n$forceIndependentMatra{$co → ̔ö;\n$forceIndependentMatra{$se → ̔ĕ;\n$forceIndependentMatra{$so → ̔o;\n$forceIndependentMatra{$nukta →; # Nukta cannot appear independently or as first character\n$forceIndependentMatra{$virama →; # Virama cannot appear independently or as first character\n$i$u → $strike;\n$aa → ā;\n$ai → ai;\n$au → au;\n$ii → ī;\n$i → i;\n$uu → ū;\n$u → u;\n$rrh → r̥ö;\n$rh → r̥ĕ;\n$llh → l̥ö;\n$lh → l̥ĕ;\n$e → e;\n$o → o;\n#extra vowels\n$ce → ĕ;\n$co → ö;\n$se → ĕ;\n$so → 
o;\n\n#dependent vowels when following independent vowels. Generally Illegal only for roundtripping\n$waa} $x → ā;\n$wai} $x → ai;\n$wau} $x → au;\n$wii} $x → ī;\n$wi } $x → i;\n$wuu} $x → ū;\n$wu } $x → u;\n$wrr} $x → r̥ö;\n$wr } $x → r̥ĕ;\n$wll} $x → l̥ö;\n$wl } $x → l̥ĕ;\n$we } $x → e;\n$wo } $x → o;\n$wa } $x → a;\n#extra vowels\n$wce} $x → ĕ;\n$wco} $x → ö;\n$wse} $x → ĕ;\n$wso} $x → o;\n$om} $x → oṁ;\n\n# independent vowels when preceeded by vowels\n$vowels{$waa → ''ā;\n$vowels{$wai → ''ai;\n$vowels{$wau → ''au;\n$vowels{$wii → ''ī;\n$vowels{$wi → ''i;\n$vowels{$wuu → ''ū;\n$vowels{$wu → ''u;\n#$vowels{$wrr → ''r̥ö;\n#$vowels{$wr → ''r̥ĕ;\n#$vowels{$wll → ''l̥ö;\n#$vowels{$wl → ''l̥ĕ;\n$vowels{$we → ''e;\n$vowels{$wo → ''o;\n$vowels{$wa → ''a;\n#extra vowels\n$vowels{$wce → ''ĕ;\n$vowels{$wco → ''ö;\n$vowels{$wse → ''ĕ;\n$vowels{$wso → ''o;\n$vowels{$om → ''oṁ;\n\n# independent vowels (otherwise)\n$waa → ā;\n$wai → ai;\n$wau → au;\n$wii → ī;\n$wi → i;\n$wuu → ū;\n$wu → u;\n$wrr → r̥ö;\n$wr → r̥ĕ;\n$wll → l̥ö;\n$wl → l̥ĕ;\n$we → e;\n$wo → o;\n$wa → a;\n#extra vowels\n$wce → ĕ;\n$wco → ö;\n$wse → ĕ;\n$wso → o;\n$om → oṁ;\n\n# stress marks\n$avagraha → ;\n$chandrabindu → ṅġ;\n$ardhachandra → ṃ;\n$visarga → ḥ;\n\n# numbers\n$zero → 0;\n$one → 1;\n$two → 2;\n$three → 3;\n$four → 4;\n$five → 5;\n$six → 6;\n$seven → 7;\n$eight → 8;\n$nine → 9;\n$lm →;\n$ailm →;\n$aulm →;\n$dgs→'';\n$kta→t;\n# Balinese numbers are surrounded by dandas which can be removed\n$danda } [$zero$one$two$three$four$five$six$seven$eight$nine] → ' ';\n[0123456789] { $danda → ' ';\n$danda→', ';\n$doubleDanda→'. 
';\n\n\\uE070→; # ABBREVIATION SIGN\n# LETTER RA WITH MIDDLE DIAGONAL\n\\uE071}$x→ra;\n\\uE071$virama→r;\n\\uE071→ra;\n# LETTER RA WITH LOWER DIAGONAL\n\\uE072}$x→ra;\n\\uE072$virama→r;\n\\uE072→ra;\n\\uE073→; # RUPEE MARK\n\\uE074→; # RUPEE SIGN\n\\uE075→; # CURRENCY NUMERATOR ONE\n\\uE076→; # CURRENCY NUMERATOR TWO\n\\uE077→; # CURRENCY NUMERATOR THREE\n\\uE078→; # CURRENCY NUMERATOR FOUR\n\\uE079→; # CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR\n\\uE07A→; # CURRENCY DENOMINATOR SIXTEEN\n\\uE07B→; # ISSHAR\n\\uE07C→; # TIPPI\n\\uE07D→; # ADDAK\n\\uE07E→; # IRI\n\\uE07F→; # URA\n\\uE080→; # EK ONKAR\n\\uE004→; # DEVANAGARI VOWEL SIGN SHORT A\n\n::NFC;\n"
},
{
"name": "Balinese-ban_001",
"rules": "::Balinese-InterIndic;\n::InterIndic-ban_001;\n"
}
]