You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

497 lines
11 KiB

This file contains ambiguous Unicode characters!

This file contains ambiguous Unicode characters that may be confused with others in your current locale. If your use case is intentional and legitimate, you can safely ignore this warning. Use the Escape button to highlight these characters.

# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html
# Generated using tools/cldr/cldr-to-icu/build-icu-data.xml
#
# File: InterIndic_Latin.txt
# Generated from CLDR
#
# InterIndic-Latin
# InterIndic private-use code points, bound to readable variable names.
# \uE000 reserved
# signs
$chandrabindu = \uE001;
$anusvara = \uE002;
$visarga = \uE003;
# \uE004 reserved
# independent (stand-alone) vowels: the names carry a leading "w"
$wa = \uE005;
$waa = \uE006;
$wi = \uE007;
$wii = \uE008;
$wu = \uE009;
$wuu = \uE00A;
$wr = \uE00B;
$wl = \uE00C;
$wce = \uE00D;  # LETTER CANDRA E
$wse = \uE00E;  # LETTER SHORT E
$we = \uE00F;   # ए LETTER E
$wai = \uE010;
$wco = \uE011;  # LETTER CANDRA O
$wso = \uE012;  # LETTER SHORT O
$wo = \uE013;   # ओ LETTER O
$wau = \uE014;
# consonants
$ka = \uE015;
$kha = \uE016;
$ga = \uE017;
$gha = \uE018;
$nga = \uE019;
$ca = \uE01A;
$cha = \uE01B;
$ja = \uE01C;
$jha = \uE01D;
$nya = \uE01E;
$tta = \uE01F;
$ttha = \uE020;
$dda = \uE021;
$ddha = \uE022;
$nna = \uE023;
$ta = \uE024;
$tha = \uE025;
$da = \uE026;
$dha = \uE027;
$na = \uE028;
$ena = \uE029;  # compatibility
$pa = \uE02A;
$pha = \uE02B;
$ba = \uE02C;
$bha = \uE02D;
$ma = \uE02E;
$ya = \uE02F;
$ra = \uE030;
$vva = \uE081;  # note: outside the contiguous \uE015-\uE039 consonant run
$rra = \uE031;
$la = \uE032;
$lla = \uE033;
$ela = \uE034;  # compatibility
$va = \uE035;
$sha = \uE036;
$ssa = \uE037;
$sa = \uE038;
$ha = \uE039;
# \uE03A reserved (original note cited \u093A)
# \uE03B reserved (original note cited \u093B)
$nukta = \uE03C;
$avagraha = \uE03D;  # SIGN AVAGRAHA
# dependent vowel signs: the names are the bare vowel (no leading "w")
$aa = \uE03E;
$i = \uE03F;
$ii = \uE040;
$u = \uE041;
$uu = \uE042;
$rh = \uE043;
$rrh = \uE044;
$ce = \uE045;  # VOWEL SIGN CANDRA E
$se = \uE046;  # VOWEL SIGN SHORT E
$e = \uE047;
$ai = \uE048;
$co = \uE049;  # VOWEL SIGN CANDRA O
$so = \uE04A;  # VOWEL SIGN SHORT O
$o = \uE04B;   # ो
$au = \uE04C;
$virama = \uE04D;
# \uE04E reserved (original note cited \u094E)
# \uE04F reserved (original note cited \u094F)
$om = \uE050;  # OM
# The four code points below have no Latin mapping; they are deleted from the output.
\uE051 → ;  # UNMAPPED STRESS SIGN UDATTA
\uE052 → ;  # UNMAPPED STRESS SIGN ANUDATTA
\uE053 → ;  # UNMAPPED GRAVE ACCENT
\uE054 → ;  # UNMAPPED ACUTE ACCENT
$lm = \uE055;    # Telugu Length Mark
$ailm = \uE056;  # AI Length Mark
$aulm = \uE057;  # AU Length Mark
# Urdu compatibility forms
$uka = \uE058;
$ukha = \uE059;
$ugha = \uE05A;
$ujha = \uE05B;
$uddha = \uE05C;
$udha = \uE05D;
$ufa = \uE05E;
$uya = \uE05F;
# additional independent vowels ($wrr, $wll) and dependent vowel signs ($lh, $llh)
$wrr = \uE060;
$wll = \uE061;
$lh = \uE062;
$llh = \uE063;
# punctuation
$danda = \uE064;
$doubleDanda = \uE065;
# digits
$zero = \uE066;   # DIGIT ZERO
$one = \uE067;    # DIGIT ONE
$two = \uE068;    # DIGIT TWO
$three = \uE069;  # DIGIT THREE
$four = \uE06A;   # DIGIT FOUR
$five = \uE06B;   # DIGIT FIVE
$six = \uE06C;    # DIGIT SIX
$seven = \uE06D;  # DIGIT SEVEN
$eight = \uE06E;  # DIGIT EIGHT
$nine = \uE06F;   # DIGIT NINE
# Glottal stop
$dgs = \uE082;
# Khanda-ta
$kta = \uE083;
# Code-point ranges of dependent vowel signs, split into two groups
# (not referenced by any rule in this section).
$depVowelAbove = [\uE03E-\uE040 \uE045-\uE04C];
$depVowelBelow = [\uE041-\uE044];
# $x was originally called '§'; $z was '%'
# $x: every dependent vowel sign; used as look-ahead context by the consonant rules.
$x = [$aa $ai $au $ii $i $uu $u $rrh $rh $lh $llh $e $o $se $ce $so $co];
# $z: Latin consonant letters.
$z = [bcdfghjklmnpqrstvwxyz];
# $vowels: Latin vowel letters, "r", and the combining marks \u0304, \u0325, \u0306.
$vowels = [aeiour \u0304 \u0325 \u0306];
# $forceIndependentMatra: anything that is neither a letter nor in \u0300-\u034C.
$forceIndependentMatra = [^[[:L:] [\u0300-\u034C]]];
######################################################################
# convert from Native letters to Latin letters
######################################################################
# Anusvara: the Latin output depends on the consonant that follows.
# The consonant after "}" is look-ahead context only and is not consumed.
$anusvara } [$ka $kha $ga $gha $nga] → n\u0307;
$anusvara } [$ca $cha $ja $jha $nya] → n\u0304;
$anusvara } [$tta $ttha $dda $ddha $nna] → n\u0323;
$anusvara } [$ta $tha $da $dha $na] → n;
$anusvara } [$pa $pha $ba $bha $ma] → m;
$anusvara } [$ya $ra $lla $la $va $ssa $sha $sa $ha] → n;
# fallback when none of the contexts above applies
$anusvara → m\u0307;
# Urdu compatibility
# Pattern used for most letters below (order matters, first match wins):
#   <letter> } $x       → bare Latin consonant (a dependent vowel sign follows; not consumed)
#   <letter> $virama    → bare Latin consonant (virama is consumed)
#   <letter>            → Latin consonant followed by "a"
$ya $nukta } $x → y\u0307;
$ya $nukta $virama → y\u0307;
$ya $nukta → y\u0307a;

$la $nukta } $x → l\u0331;
$la $nukta $virama → l\u0331;
$la $nukta → l\u0331a;

$na $nukta } $x → n\u0331;
$na $nukta $virama → n\u0331;
$na $nukta → n\u0331a;
$ena } $x → n\u0331;
$ena $virama → n\u0331;
$ena → n\u0331a;

$uka → qa;
$ka $nukta } $x → q;
$ka $nukta $virama → q;
$ka $nukta → qa;

$kha $nukta } $x → k\u0331h\u0331;
$kha $nukta $virama → k\u0331h\u0331;
$kha $nukta → k\u0331h\u0331a;
$ukha $virama → k\u0331h\u0331;
$ukha → k\u0331h\u0331a;

$ugha → g\u0307a;
$ga $nukta } $x → g\u0307;
$ga $nukta $virama → g\u0307;
$ga $nukta → g\u0307a;

$ujha → za;
$ja $nukta } $x → z;
$ja $nukta $virama → z;
$ja $nukta → za;

$ddha $nukta } $x → r\u0323h;
$ddha $nukta $virama → r\u0323h;
$ddha $nukta → r\u0323ha;
$uddha } $x → r\u0323;
$uddha $virama → r\u0323;
$uddha → r\u0323a;
$udha → r\u0323a;
$dda $nukta } $x → r\u0323;
$dda $nukta $virama → r\u0323;
$dda $nukta → r\u0323a;

$pha $nukta } $x → f;
$pha $nukta $virama → f;
$pha $nukta → fa;
$ufa } $x → f;
$ufa $virama → f;
$ufa → fa;

$ra $nukta } $x → r\u0331;
$ra $nukta $virama → r\u0331;
$ra $nukta → r\u0331a;

$lla $nukta } $x → l\u0331;
$lla $nukta $virama → l\u0331;
$lla $nukta → l\u0331a;
$ela } $x → l\u0331;
$ela $virama → l\u0331;
$ela → l\u0331a;

$uya } $x → y\u0307;
$uya $virama → y\u0307;
$uya → y\u0307a;
# normal consonants
# Per consonant, in priority order:
#   C $virama } $ha  → consonant plus an apostrophe ('' is a literal '), only for
#                      consonants that also have an "...h" counterpart below
#   C } $x           → bare consonant (dependent vowel sign follows, not consumed)
#   C $virama        → bare consonant
#   C                → consonant followed by "a"
$ka $virama } $ha → k'';
$ka } $x → k;
$ka $virama → k;
$ka → ka;

$kha } $x → kh;
$kha $virama → kh;
$kha → kha;

$ga $virama } $ha → g'';
$ga } $x → g;
$ga $virama → g;
$ga → ga;

$gha } $x → gh;
$gha $virama → gh;
$gha → gha;

$nga } $x → n\u0307;
$nga $virama → n\u0307;
$nga → n\u0307a;

$ca $virama } $ha → c'';
$ca } $x → c;
$ca $virama → c;
$ca → ca;

$cha } $x → ch;
$cha $virama → ch;
$cha → cha;

$ja $virama } $ha → j'';
$ja } $x → j;
$ja $virama → j;
$ja → ja;

$jha } $x → jh;
$jha $virama → jh;
$jha → jha;

$nya } $x → n\u0303;
$nya $virama → n\u0303;
$nya → n\u0303a;

$tta $virama } $ha → t\u0323'';
$tta } $x → t\u0323;
$tta $virama → t\u0323;
$tta → t\u0323a;

$ttha } $x → t\u0323h;
$ttha $virama → t\u0323h;
$ttha → t\u0323ha;
# $dda
# A virama-terminated $dda directly before $ha gets a literal apostrophe ('' in rule
# syntax) so that the result (d\u0323'ha) differs from the output of $ddha (d\u0323ha).
# This mirrors the sibling rules for $tta, $da, $ka, etc. The previous form
# "$dda } $x $ha" never matched the virama case and instead added a stray apostrophe
# to $dda + vowel sign + $ha.
$dda$virama}$ha→d\u0323'';
# a dependent vowel sign follows (look-ahead only): emit the bare consonant
$dda}$x→d\u0323;
# explicit virama: emit the bare consonant and consume the virama
$dda$virama→d\u0323;
# otherwise: consonant followed by "a"
$dda→d\u0323a;
# Remaining consonants. Per consonant, in priority order:
#   C $virama } <next>  → consonant plus a literal apostrophe ('') before specific letters
#   C } $x              → bare consonant (dependent vowel sign follows, not consumed)
#   C $virama           → bare consonant
#   C                   → consonant followed by "a"
$ddha } $x → d\u0323h;
$ddha $virama → d\u0323h;
$ddha → d\u0323ha;

$nna } $x → n\u0323;
$nna $virama → n\u0323;
$nna → n\u0323a;

$ta $virama } $ha → t'';
$ta $virama } $ttha → t'';
$ta $virama } $tta → t'';
$ta $virama } $tha → t'';
$ta } $x → t;
$ta $virama → t;
$ta → ta;

$tha } $x → th;
$tha $virama → th;
$tha → tha;

$da $virama } $ha → d'';
$da $virama } $ddha → d'';
$da $virama } $dda → d'';
$da $virama } $dha → d'';
$da } $x → d;
$da $virama → d;
$da → da;

$dha } $x → dh;
$dha $virama → dh;
$dha → dha;

$na $virama } $ga → n'';
$na $virama } $ya → n'';
$na } $x → n;
$na $virama → n;
$na → na;

$pa $virama } $ha → p'';
$pa } $x → p;
$pa $virama → p;
$pa → pa;

$pha } $x → ph;
$pha $virama → ph;
$pha → pha;

$ba $virama } $ha → b'';
$ba } $x → b;
$ba $virama → b;
$ba → ba;

$bha } $x → bh;
$bha $virama → bh;
$bha → bha;

$ma $virama } $ma → m'';
$ma } $x → m;
$ma $virama → m;
$ma → ma;

$ya } $x → y;
$ya $virama → y;
$ya → ya;

$ra $virama } $ha → r'';
$ra } $x → r;
$ra $virama → r;
$ra → ra;

$vva $virama } $ha → w\u0307'';
$vva } $x → w\u0307;
$vva $virama → w\u0307;
$vva → w\u0307a;

$rra $virama } $ha → r\u0331'';
$rra } $x → r\u0331;
$rra $virama → r\u0331;
$rra → r\u0331a;

$la $virama } $ha → l'';
$la } $x → l;
$la $virama → l;
$la → la;

$lla $virama } $ha → l\u0323'';
$lla } $x → l\u0323;
$lla $virama → l\u0323;
$lla → l\u0323a;

$va } $x → v;
$va $virama → v;
$va → va;

$sa $virama } $ha → s'';
$sa $virama } $sha → s'';
$sa $virama } $ssa → s'';
$sa $virama } $sa → s'';
$sa } $x → s;
$sa $virama → s;
# for Gurmukhi: $sa with nukta; these must stay ahead of the plain "$sa → sa" fallback
$sa $nukta } $x → s\u0301;
$sa $nukta $virama → s\u0301;
$sa $nukta → s\u0301a;
$sa → sa;

$sha } $x → s\u0301;
$sha $virama → s\u0301;
$sha → s\u0301a;

$ssa } $x → s\u0323;
$ssa $virama → s\u0323;
$ssa → s\u0323a;

$ha } $x → h;
$ha $virama → h;
$ha → ha;
# dependent vowels (should never occur except following consonants)
# When the preceding character is in $forceIndependentMatra (the text before "{" is
# look-behind context only), the Latin vowel is prefixed with \u0314.
$forceIndependentMatra { $aa → \u0314a\u0304;
$forceIndependentMatra { $ai → \u0314ai;
$forceIndependentMatra { $au → \u0314au;
$forceIndependentMatra { $ii → \u0314i\u0304;
$forceIndependentMatra { $i → \u0314i;
$forceIndependentMatra { $uu → \u0314u\u0304;
$forceIndependentMatra { $u → \u0314u;
$forceIndependentMatra { $rrh → \u0314r\u0325\u0304;
$forceIndependentMatra { $rh → \u0314r\u0325;
$forceIndependentMatra { $llh → \u0314l\u0325\u0304;
$forceIndependentMatra { $lh → \u0314l\u0325;
$forceIndependentMatra { $e → \u0314e\u0304;
$forceIndependentMatra { $o → \u0314o\u0304;
# extra vowels
$forceIndependentMatra { $ce → \u0314e\u0306;
$forceIndependentMatra { $co → \u0314o\u0306;
$forceIndependentMatra { $se → \u0314e;
$forceIndependentMatra { $so → \u0314o;
$forceIndependentMatra { $nukta → ;   # Nukta cannot appear independently or as first character
$forceIndependentMatra { $virama → ;  # Virama cannot appear independently or as first character

# dependent vowels in any other position: plain Latin vowel
$aa → a\u0304;
$ai → ai;
$au → au;
$ii → i\u0304;
$i → i;
$uu → u\u0304;
$u → u;
$rrh → r\u0325\u0304;
$rh → r\u0325;
$llh → l\u0325\u0304;
$lh → l\u0325;
$e → e\u0304;
$o → o\u0304;
# extra vowels
$ce → e\u0306;
$co → o\u0306;
$se → e;
$so → o;
# Dependent vowels following independent vowels. Generally illegal; kept only for round-tripping.
# An independent vowel that is followed by a dependent vowel sign ($x, look-ahead only)
# gets \u0314 appended to its Latin form.
$waa } $x → a\u0304\u0314;
$wai } $x → ai\u0314;
$wau } $x → au\u0314;
$wii } $x → i\u0304\u0314;
$wi } $x → i\u0314;
$wuu } $x → u\u0304\u0314;
$wu } $x → u\u0314;
$wrr } $x → r\u0325\u0304\u0314;
$wr } $x → r\u0325\u0314;
$wll } $x → l\u0325\u0304\u0314;
$wl } $x → l\u0325\u0314;
$we } $x → e\u0304\u0314;
$wo } $x → o\u0304\u0314;
$wa } $x → a\u0314;
# extra vowels
$wce } $x → e\u0306\u0314;
$wco } $x → o\u0306\u0314;
$wse } $x → e\u0314;
$wso } $x → o\u0314;
$om } $x → ''om\u0314;
# independent vowels when preceded by vowels
# The look-behind context $vowels matches already-produced Latin output; in that case
# a literal apostrophe ('' in rule syntax) is placed before the vowel.
$vowels { $waa → ''a\u0304;
$vowels { $wai → ''ai;
$vowels { $wau → ''au;
$vowels { $wii → ''i\u0304;
$vowels { $wi → ''i;
$vowels { $wuu → ''u\u0304;
$vowels { $wu → ''u;
$vowels { $wrr → ''r\u0325\u0304;
$vowels { $wr → ''r\u0325;
$vowels { $wll → ''l\u0325\u0304;
$vowels { $wl → ''l\u0325;
$vowels { $we → ''e\u0304;
$vowels { $wo → ''o\u0304;
$vowels { $wa → ''a;
# extra vowels
$vowels { $wce → ''e\u0306;
$vowels { $wco → ''o\u0306;
$vowels { $wse → ''e;
$vowels { $wso → ''o;

# independent vowels (otherwise)
$waa → a\u0304;
$wai → ai;
$wau → au;
$wii → i\u0304;
$wi → i;
$wuu → u\u0304;
$wu → u;
$wrr → r\u0325\u0304;
$wr → r\u0325;
$wll → l\u0325\u0304;
$wl → l\u0325;
$we → e\u0304;
$wo → o\u0304;
$wa → a;
# extra vowels
$wce → e\u0306;
$wco → o\u0306;
$wse → e;
$wso → o;
$om → ''om;
# signs: avagraha, chandrabindu, visarga
$avagraha → \u0315;
# the two-sign sequence must be tried before the single chandrabindu rule
$chandrabindu $anusvara → \u0303;
$chandrabindu → m\u0310;
$visarga → h\u0323;

# digits
$zero → 0;
$one → 1;
$two → 2;
$three → 3;
$four → 4;
$five → 5;
$six → 6;
$seven → 7;
$eight → 8;
$nine → 9;

# length marks are dropped
$lm → ;
$ailm → ;
$aulm → ;

$dgs → ʔ;
$kta → t\u0331;

# both danda forms become a full stop
$danda → '.';
$doubleDanda → '.';

\uE070 → ;  # ABBREVIATION SIGN

# LETTER RA WITH MIDDLE DIAGONAL
\uE071 } $x → ra;
\uE071 $virama → r;
\uE071 → ra;

# LETTER RA WITH LOWER DIAGONAL
\uE072 } $x → ra;
\uE072 $virama → r;
\uE072 → ra;

# code points with no Latin mapping: removed from the output
\uE073 → ;  # RUPEE MARK
\uE074 → ;  # RUPEE SIGN
\uE075 → ;  # CURRENCY NUMERATOR ONE
\uE076 → ;  # CURRENCY NUMERATOR TWO
\uE077 → ;  # CURRENCY NUMERATOR THREE
\uE078 → ;  # CURRENCY NUMERATOR FOUR
\uE079 → ;  # CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR
\uE07A → ;  # CURRENCY DENOMINATOR SIXTEEN
\uE07B → ;  # ISSHAR
\uE07C → ;  # TIPPI
\uE07D → ;  # ADDAK
\uE07E → ;  # IRI
\uE07F → ;  # URA
\uE080 → ;  # EK ONKAR
\uE004 → ;  # DEVANAGARI VOWEL SIGN SHORT A