<?xml version="1.0" encoding="UTF-8" ?> <!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd"> <!-- Copyright © 1991-2013 Unicode, Inc. CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/) For terms of use, see http://www.unicode.org/copyright.html --> <supplementalData> <version number="$Revision: 12137 $"/> <transforms> <transform source="InterIndic" target="Latin" direction="forward" visibility="internal"> <tRule> # InterIndic-Latin #\u0E00 reserved #consonants $chandrabindu=\uE001; $anusvara=\uE002; $visarga=\uE003; #\u0E004 reserved # w←vowel→ represents the stand-alone form $wa=\uE005; $waa=\uE006; $wi=\uE007; $wii=\uE008; $wu=\uE009; $wuu=\uE00A; $wr=\uE00B; $wl=\uE00C; $wce=\uE00D; # LETTER CANDRA E $wse=\uE00E; # LETTER SHORT E $we=\uE00F; # ए LETTER E $wai=\uE010; $wco=\uE011; # LETTER CANDRA O $wso=\uE012; # LETTER SHORT O $wo=\uE013; # ओ LETTER O $wau=\uE014; $ka=\uE015; $kha=\uE016; $ga=\uE017; $gha=\uE018; $nga=\uE019; $ca=\uE01A; $cha=\uE01B; $ja=\uE01C; $jha=\uE01D; $nya=\uE01E; $tta=\uE01F; $ttha=\uE020; $dda=\uE021; $ddha=\uE022; $nna=\uE023; $ta=\uE024; $tha=\uE025; $da=\uE026; $dha=\uE027; $na=\uE028; $ena=\uE029; #compatibility $pa=\uE02A; $pha=\uE02B; $ba=\uE02C; $bha=\uE02D; $ma=\uE02E; $ya=\uE02F; $ra=\uE030; $vva=\uE081; $rra=\uE031; $la=\uE032; $lla=\uE033; $ela=\uE034; #compatibility $va=\uE035; $sha=\uE036; $ssa=\uE037; $sa=\uE038; $ha=\uE039; #\u093A Reserved #\u093B Reserved $nukta=\uE03C; $avagraha=\uE03D; # SIGN AVAGRAHA # ←vowel→ represents the dependent form $aa=\uE03E; $i=\uE03F; $ii=\uE040; $u=\uE041; $uu=\uE042; $rh=\uE043; $rrh=\uE044; $ce=\uE045; #VOWEL SIGN CANDRA E $se=\uE046; #VOWEL SIGN SHORT E $e=\uE047; $ai=\uE048; $co=\uE049; # VOWEL SIGN CANDRA O $so=\uE04A; # VOWEL SIGN SHORT O $o=\uE04B; # ो $au=\uE04C; $virama=\uE04D; # \u094E Reserved # \u094F Reserved $om=\uE050; # OM \uE051→; # UNMAPPED STRESS SIGN UDATTA \uE052→; # UNMAPPED STRESS SIGN ANUDATTA \uE053→; # UNMAPPED GRAVE ACCENT \uE054→; # UNMAPPED ACUTE ACCENT $lm = \uE055;# Telugu Length Mark $ailm=\uE056;# AI Length Mark $aulm=\uE057;# AU Length Mark #urdu compatibity forms $uka=\uE058; $ukha=\uE059; $ugha=\uE05A; $ujha=\uE05B; $uddha=\uE05C; $udha=\uE05D; $ufa=\uE05E; $uya=\uE05F; $wrr=\uE060; $wll=\uE061; $lh=\uE062; $llh=\uE063; $danda=\uE064; $doubleDanda=\uE065; $zero=\uE066; # DIGIT ZERO $one=\uE067; # DIGIT ONE $two=\uE068; # DIGIT TWO $three=\uE069; # DIGIT THREE $four=\uE06A; # DIGIT FOUR $five=\uE06B; # DIGIT FIVE $six=\uE06C; # DIGIT SIX $seven=\uE06D; # DIGIT SEVEN $eight=\uE06E; # DIGIT EIGHT $nine=\uE06F; # DIGIT NINE # Glottal stop $dgs=\uE082; #Khanda-ta $kta=\uE083; $depVowelAbove=[\uE03E-\uE040\uE045-\uE04C]; $depVowelBelow=[\uE041-\uE044]; # $x was originally called '§'; $z was '%' $x=[$aa$ai$au$ii$i$uu$u$rrh$rh$lh$llh$e$o$se$ce$so$co]; $z=[bcdfghjklmnpqrstvwxyz]; $vowels=[aeiour̥̄̆]; $forceIndependentMatra = [^[[:L:][̀-͌]]]; ###################################################################### # convert from Native letters to Latin letters ###################################################################### #transliterations for anusvara $anusvara} [$ka$kha$ga$gha$nga] → ṅ; $anusvara} [$ca$cha$ja$jha$nya] → n̄; $anusvara} [$tta$ttha$dda$ddha$nna] → ṇ; $anusvara} [$ta$tha$da$dha$na] → n; $anusvara} [$pa$pha$ba$bha$ma] → m; $anusvara} [$ya$ra$lla$la$va$ssa$sha$sa$ha] → n; $anusvara→ ṁ; # Urdu compatibility $ya$nukta}$x → ẏ; $ya$nukta$virama → ẏ; $ya$nukta → ẏa; $la$nukta }$x → ḻ; $la$nukta$virama → ḻ; $la$nukta → ḻa; $na$nukta }$x → ṉ; $na$nukta$virama → ṉ; $na$nukta → ṉa; $ena }$x → ṉ; $ena$virama → ṉ; $ena → ṉa; $uka → qa; $ka$nukta }$x → q; $ka$nukta$virama → q; $ka$nukta → qa; $kha$nukta }$x → ḵẖ; $kha$nukta$virama → ḵẖ; $kha$nukta → ḵẖa; $ukha$virama → ḵẖ; $ukha → ḵẖa; $ugha → ġa; $ga$nukta }$x → ġ; $ga$nukta$virama → ġ; $ga$nukta → ġa; $ujha → za; $ja$nukta }$x → z; $ja$nukta$virama → z; $ja$nukta → za; $ddha$nukta}$x → ṛh; $ddha$nukta$virama → ṛh; $ddha$nukta → ṛha; $uddha}$x → ṛ; $uddha$virama → ṛ; $uddha → ṛa; $udha → ṛa; $dda$nukta}$x → ṛ; $dda$nukta$virama → ṛ; $dda$nukta → ṛa; $pha$nukta }$x → f; $pha$nukta$virama → f; $pha$nukta → fa; $ufa }$x → f; $ufa$virama → f; $ufa → fa; $ra$nukta}$x → ṟ; $ra$nukta$virama → ṟ; $ra$nukta → ṟa; $lla$nukta}$x → ḻ; $lla$nukta$virama → ḻ; $lla$nukta → ḻa; $ela}$x → ḻ; $ela$virama → ḻ; $ela → ḻa; $uya}$x → ẏ; $uya$virama → ẏ; $uya → ẏa; # normal consonants $ka$virama}$ha→k''; $ka}$x→k; $ka$virama→k; $ka→ka; $kha}$x→kh; $kha$virama→kh; $kha→kha; $ga$virama}$ha→g''; $ga}$x→g; $ga$virama→g; $ga→ga; $gha}$x→gh; $gha$virama→gh; $gha→gha; $nga}$x→ṅ; $nga$virama→ṅ; $nga→ṅa; $ca$virama}$ha→c''; $ca}$x→c; $ca$virama→c; $ca→ca; $cha}$x→ch; $cha$virama→ch; $cha→cha; $ja$virama}$ha→j''; $ja}$x→j; $ja$virama→j; $ja→ja; $jha}$x→jh; $jha$virama→jh; $jha→jha; $nya }$x→ñ; $nya$virama→ñ; $nya → ña; $tta$virama}$ha→ṭ''; $tta}$x→ṭ; $tta$virama→ṭ; $tta→ṭa; $ttha}$x→ṭh; $ttha$virama→ṭh; $ttha→ṭha; $dda}$x$ha→ḍ''; $dda}$x→ḍ; $dda$virama→ḍ; $dda→ḍa; $ddha}$x→ḍh; $ddha$virama→ḍh; $ddha→ḍha; $nna}$x→ṇ; $nna$virama→ṇ; $nna→ṇa; $ta$virama}$ha→t''; $ta$virama}$ttha→t''; $ta$virama}$tta→t''; $ta$virama}$tha→t''; $ta}$x→t; $ta$virama→t; $ta→ta; $tha}$x→th; $tha$virama→th; $tha→tha; $da$virama}$ha→d''; $da$virama}$ddha→d''; $da$virama}$dda→d''; $da$virama}$dha→d''; $da}$x→d; $da$virama→d; $da→da; $dha}$x→dh; $dha$virama→dh; $dha→dha; $na$virama}$ga→n''; $na$virama}$ya→n''; $na}$x→n; $na$virama→n; $na→na; $pa$virama}$ha→p''; $pa}$x→p; $pa$virama→p; $pa→pa; $pha}$x→ph; $pha$virama→ph; $pha→pha; $ba$virama}$ha→b''; $ba}$x→b; $ba$virama→b; $ba→ba; $bha}$x→bh; $bha$virama→bh; $bha→bha; $ma$virama}$ma→m''; $ma}$x→m; $ma$virama→m; $ma→ma; $ya}$x→y; $ya$virama→y; $ya→ya; $ra$virama}$ha→r''; $ra}$x→r; $ra$virama→r; $ra→ra; $vva$virama}$ha→ẇ''; $vva}$x→ẇ; $vva$virama→ẇ; $vva→ẇa; $rra$virama}$ha→ṟ''; $rra}$x→ṟ; $rra$virama→ṟ; $rra→ṟa; $la$virama}$ha→l''; $la}$x→l; $la$virama→l; $la→la; $lla$virama}$ha→ḷ''; $lla}$x→ḷ; $lla$virama→ḷ; $lla→ḷa; $va}$x→v; $va$virama→v; $va→va; $sa$virama}$ha→s''; $sa$virama}$sha→s''; $sa$virama}$ssa→s''; $sa$virama}$sa→s''; $sa}$x→s; $sa$virama→s; #for gurmukhi $sa$nukta}$x→ś; $sa$nukta$virama→ś; $sa$nukta→śa; $sa→sa; $sha}$x→ś; $sha$virama→ś; $sha→śa; $ssa}$x→ṣ; $ssa$virama→ṣ; $ssa→ṣa; $ha}$x→h; $ha$virama→h; $ha→ha; # dependent vowels (should never occur except following consonants) $forceIndependentMatra{$aa → ̔ā; $forceIndependentMatra{$ai → ̔ai; $forceIndependentMatra{$au → ̔au; $forceIndependentMatra{$ii → ̔ī; $forceIndependentMatra{$i → ̔i; $forceIndependentMatra{$uu → ̔ū; $forceIndependentMatra{$u → ̔u; $forceIndependentMatra{$rrh → ̔r̥̄; $forceIndependentMatra{$rh → ̔r̥; $forceIndependentMatra{$llh → ̔l̥̄; $forceIndependentMatra{$lh → ̔l̥; $forceIndependentMatra{$e → ̔ē; $forceIndependentMatra{$o → ̔ō; #extra vowels $forceIndependentMatra{$ce → ̔ĕ; $forceIndependentMatra{$co → ̔ŏ; $forceIndependentMatra{$se → ̔e; $forceIndependentMatra{$so → ̔o; $forceIndependentMatra{$nukta →; # Nukta cannot appear independently or as first character $forceIndependentMatra{$virama →; # Virama cannot appear independently or as first character $aa → ā; $ai → ai; $au → au; $ii → ī; $i → i; $uu → ū; $u → u; $rrh → r̥̄; $rh → r̥; $llh → l̥̄; $lh → l̥; $e → ē; $o → ō; #extra vowels $ce → ĕ; $co → ŏ; $se → e; $so → o; #dependent vowels when following independent vowels. Generally Illegal only for roundtripping $waa} $x → ā̔; $wai} $x → ai̔; $wau} $x → au̔; $wii} $x → ī̔; $wi } $x → i̔; $wuu} $x → ū̔; $wu } $x → u̔; $wrr} $x → r̥̄̔; $wr } $x → r̥̔; $wll} $x → l̥̄̔; $wl } $x → l̥̔; $we } $x → ē̔; $wo } $x → ō̔; $wa } $x → a̔; #extra vowels $wce} $x → ĕ̔; $wco} $x → ŏ̔; $wse} $x → e̔; $wso} $x → o̔; $om} $x → ''om̔; # independent vowels when preceeded by vowels $vowels{$waa → ''ā; $vowels{$wai → ''ai; $vowels{$wau → ''au; $vowels{$wii → ''ī; $vowels{$wi → ''i; $vowels{$wuu → ''ū; $vowels{$wu → ''u; $vowels{$wrr → ''r̥̄; $vowels{$wr → ''r̥; $vowels{$wll → ''l̥̄; $vowels{$wl → ''l̥; $vowels{$we → ''ē; $vowels{$wo → ''ō; $vowels{$wa → ''a; #extra vowels $vowels{$wce → ''ĕ; $vowels{$wco → ''ŏ; $vowels{$wse → ''e; $vowels{$wso → ''o; # independent vowels (otherwise) $waa → ā; $wai → ai; $wau → au; $wii → ī; $wi → i; $wuu → ū; $wu → u; $wrr → r̥̄; $wr → r̥; $wll → l̥̄; $wl → l̥; $we → ē; $wo → ō; $wa → a; #extra vowels $wce → ĕ; $wco → ŏ; $wse → e; $wso → o; $om → ''om; #stress marks $avagraha → ̕; $chandrabindu$anusvara→̃; $chandrabindu → m̐; $visarga→ḥ; #numbers $zero → 0; $one → 1; $two → 2; $three → 3; $four → 4; $five → 5; $six → 6; $seven → 7; $eight → 8; $nine → 9; $lm →; $ailm →; $aulm →; $dgs→ʔ; $kta→ṯ; $danda→'.'; $doubleDanda→'.'; \uE070→; # ABBREVIATION SIGN # LETTER RA WITH MIDDLE DIAGONAL \uE071}$x→ra; \uE071$virama→r; \uE071→ra; # LETTER RA WITH LOWER DIAGONAL \uE072}$x→ra; \uE072$virama→r; \uE072→ra; \uE073→; # RUPEE MARK \uE074→; # RUPEE SIGN \uE075→; # CURRENCY NUMERATOR ONE \uE076→; # CURRENCY NUMERATOR TWO \uE077→; # CURRENCY NUMERATOR THREE \uE078→; # CURRENCY NUMERATOR FOUR \uE079→; # CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR \uE07A→; # CURRENCY DENOMINATOR SIXTEEN \uE07B→; # ISSHAR \uE07C→; # TIPPI \uE07D→; # ADDAK \uE07E→; # IRI \uE07F→; # URA \uE080→; # EK ONKAR \uE004→; # DEVANAGARI VOWEL SIGN SHORT A </tRule> </transform> </transforms> </supplementalData>