X-Git-Url: https://git.saurik.com/apple/icu.git/blobdiff_plain/374ca955a76ecab1204ca8bfa63ff9238d998416..249c4c5ea9376c24572daf9c2effa7484a282f14:/icuSources/data/translit/InterIndic_Gurmukhi.txt diff --git a/icuSources/data/translit/InterIndic_Gurmukhi.txt b/icuSources/data/translit/InterIndic_Gurmukhi.txt index a2236da9..c04b54c8 100644 --- a/icuSources/data/translit/InterIndic_Gurmukhi.txt +++ b/icuSources/data/translit/InterIndic_Gurmukhi.txt @@ -1,147 +1,148 @@ -#-------------------------------------------------------------------- -# Copyright (c) 1999-2004, International Business Machines -# Corporation and others. All Rights Reserved. -#-------------------------------------------------------------------- +# © 2016 and later: Unicode, Inc. and others. +# License & terms of use: http://www.unicode.org/copyright.html#License +# +# File: InterIndic_Gurmukhi.txt +# Generated from CLDR +# # InterIndic-Gurmukhi #:: NFD (NFC) ; -$vowel = [\u0A05-\u0A14 \u0A3e-\u0A4D]; -$consonant = [\u0A15-\u0A39]; - -\ue001>\u0a01; # SIGN CHANDRABINDU +$vowel = [ਅ-ਔ ਾ-\u0A4D]; +$consonant = [ਕ-ਹ]; +\uE001→\u0A01; # SIGN CHANDRABINDU #rules for BINDI - # Anusvara is equivalent to BINDI when preceeded by a vowel -$vowel{\ue002>\u0a02; # SIGN ANUSVARA (\u0a02 = SIGN BINDI) +$vowel{\uE002→\u0A02; # SIGN ANUSVARA (\u0A02 = SIGN BINDI) # else is equivalent to TIPPI -$consonant{\ue002>\u0a70; # SIGN TIPPI -\ue002>\u0a02; - -\ue003>; # FALLBACK BLOW AWAY SIGN VISARGA -\uE004>\u0a05; # FALLBACK TO LETTER A -\ue005>\u0a05; # LETTER A -\ue006>\u0a06; # LETTER AA -\ue007>\u0a07; # LETTER I -\ue008>\u0a08; # LETTER II -\ue009>\u0a09; # LETTER U -\ue00a>\u0a0a; # LETTER UU -\ue00b>\u0a30\u0a3f; # REMAP (indicExceptions.txt): \u0a0b>\u0a30\u0a3f = LETTER VOCALIC R>LETTER RA.VOWEL SIGN I -\ue00c>\u0a33; # FALLBACK -\ue00d>\u0a0f; # FALLBACK -\ue00e>\u0a0f; # FALLBACK -\ue00f>\u0a0f; # LETTER EE -\ue010>\u0a10; # LETTER AI -\ue011>\u0a13; # FALLBACK -\ue012>\u0a13; # FALLBACK -\ue013>\u0a13; # 
LETTER OO -\ue014>\u0a14; # LETTER AU -\ue015>\u0a15; # LETTER KA -\ue016>\u0a16; # LETTER KHA -\ue017>\u0a17; # LETTER GA -\ue018>\u0a18; # LETTER GHA -\ue019>\u0a19; # LETTER NGA -\ue01a>\u0a1a; # LETTER CA -\ue01b>\u0a1b; # LETTER CHA -\ue01c>\u0a1c; # LETTER JA -\ue01d>\u0a1d; # LETTER JHA -\ue01e>\u0a1e; # LETTER NYA -\ue01f>\u0a1f; # LETTER TTA -\ue020>\u0a20; # LETTER TTHA -\ue021>\u0a21; # LETTER DDA -\ue022>\u0a22; # LETTER DDHA -\ue023>\u0a23; # LETTER NNA -\ue024>\u0a24; # LETTER TA -\ue025>\u0a25; # LETTER THA -\ue026>\u0a26; # LETTER DA -\ue027>\u0a27; # LETTER DHA -\ue028>\u0a28; # LETTER NA -\ue029>\u0a28\u0a3c; # REMAP (indicExceptions.txt): \u0a29>\u0a28 = LETTER NNNA>LETTER NA -\ue02a>\u0a2a; # LETTER PA -\ue02b>\u0a2b; # LETTER PHA -\ue02c>\u0a2c; # LETTER BA -\ue02d>\u0a2d; # LETTER BHA -\ue02e>\u0a2e; # LETTER MA -\ue02f>\u0a2f; # LETTER YA -\ue030>\u0a30; # LETTER RA -\ue031>\u0a30\u0a3c; # FALLBACK LETTER RA+NUKTA -\ue032>\u0a32; # LETTER LA -\ue033>\u0a33; # LETTER LLA -\ue034>\u0a33; # REMAP (indicExceptions.txt): \u0a34>\u0a33 = LETTER LLLA>LETTER LLA -\ue035>\u0a35; # LETTER VA -\ue036>\u0a36; # LETTER SHA -\ue037>\u0a36; # REMAP (indicExceptions.txt): \u0a37>\u0a36 = LETTER SSA>LETTER SHA -\ue038>\u0a38; # LETTER SA -\ue039>\u0a39; # LETTER HA -\ue03c>\u0a3c; # SIGN NUKTA -\ue03d>; # FALLBACK BLOW AWAY SIGN AVAGRAHA -\ue03e>\u0a3e; # VOWEL SIGN AA -\ue03f>\u0a3f; # VOWEL SIGN I -\ue040>\u0a40; # VOWEL SIGN II -\ue041>\u0a41; # VOWEL SIGN U -\ue042>\u0a42; # VOWEL SIGN UU -\ue043>; # FALLBACK BLOW AWAY VOWEL SIGN VOCALIC R -\ue044>; # FALLBACK BLOW AWAY VOWEL SIGN VOCALIC RR -\ue045>\u0a48; # REMAP (indicExceptions.txt): \u0a45>\u0a48 = VOWEL SIGN CANDRA E>VOWEL SIGN AI -\ue046>\u0a47; # FALLABCK -\ue047>\u0a47; # VOWEL SIGN EE -\ue048>\u0a48; # VOWEL SIGN AI -\ue049>\u0a4c; # REMAP (indicExceptions.txt): \u0a49>\u0a4c = VOWEL SIGN CANDRA O>VOWEL SIGN AU -\ue04a>\u0a4b; # FALLBACK -\ue04b>\u0a4b; # VOWEL SIGN OO -\ue04c>\u0a4c; # VOWEL 
SIGN AU -\ue04d>\u0a4d; # SIGN VIRAMA -\ue050>\u0a0f\u0a02; # FALLBACK to OO+BINDI : OM -\ue051>; -\ue052>; -\ue053>; -\ue054>; -\ue055>; # FALLBACK BLOW AWAY LENGTH MARK -\ue056>\u0a48; # REMAP (indicExceptions.txt): \u0a56>\u0a48 = AI LENGTH MARK>VOWEL SIGN AI -\ue057>\u0a4c; # REMAP (indicExceptions.txt): \u0a57>\u0a4c = AU LENGTH MARK>VOWEL SIGN AU -\ue058>\u0a15\u0a3c; # FALLBACK RA+ NUKTA -\ue059>\u0a59; # LETTER KHHA -\ue05a>\u0a5a; # LETTER GHHA -\ue05b>\u0a5b; # LETTER ZA -\ue05c>\u0a5c; # LETTER RRA -\ue05d>\u0a22\u0a3c; # REMAP (indicExceptions.txt): \u0a5d>\u0a22\u0a3c = LETTER RHA>LETTER DDHA.SIGN NUKTA -\ue05e>\u0a5e; # LETTER FA -\ue05f>\u0a2f\u0a3c; # REMAP (indicExceptions.txt): \u0a5f>\u0a2f = LETTER YYA>LETTER YA -\ue060>\u0a30\u0a3f; # REMAP (indicExceptions.txt): \u0a60>\u0a30\u0a3f = LETTER VOCALIC RR>LETTER RA.VOWEL SIGN I -\ue061>\u0a32\u0a3c; # -\ue062>\u0a3f\u0a3c; # REMAP (indicExceptions.txt): \u0a62>\u0a3f\u0a3c = VOWEL SIGN VOCALIC L>VOWEL SIGN I.SIGN NUKTA -\ue063>\u0a40\u0a3c; # REMAP (indicExceptions.txt): \u0a63>\u0a40\u0a3c = VOWEL SIGN VOCALIC LL>VOWEL SIGN II.SIGN NUKTA -\uE064>\u0964; # DANDA -\uE065>\u0965; # DOUBLE DANDA -\ue066>\u0a66; # DIGIT ZERO -\ue067>\u0a67; # DIGIT ONE -\ue068>\u0a68; # DIGIT TWO -\ue069>\u0a69; # DIGIT THREE -\ue06a>\u0a6a; # DIGIT FOUR -\ue06b>\u0a6b; # DIGIT FIVE -\ue06c>\u0a6c; # DIGIT SIX -\ue06d>\u0a6d; # DIGIT SEVEN -\ue06e>\u0a6e; # DIGIT EIGHT -\ue06f>\u0a6f; # DIGIT NINE -\ue070>; # ABBREVIATION SIGN -\ue071>\u0a30; # LETTER RA WITH MIDDLE DIAGONAL -\ue072>\u0a30; # LETTER RA WITH LOWER DIAGONAL -\ue073>; # RUPEE MARK -\ue074>; # RUPEE SIGN -\ue075>; # CURRENCY NUMERATOR ONE -\ue076>; # CURRENCY NUMERATOR TWO -\ue077>; # CURRENCY NUMERATOR THREE -\ue078>; # CURRENCY NUMERATOR FOUR -\ue079>; # CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR -\ue07A>; # CURRENCY DENOMINATOR SIXTEEN -\ue07B>; # ISSHAR -\uE07C>\u0a70; # TIPPI -\uE07D>\u0a71; # ADDAK -\uE07E>\u0a72; # IRI -\uE07F>\u0a73; # URA 
-\uE080>\u0a74; # EK ONKAR -\uE081>\u0a35; # FALLBACK FOR ORIYA LETTER WA - -0 > \u0a66; # FALLBACK FOR TAMIL -1 > \u0a67; +$consonant{\uE002→\u0A70; # SIGN TIPPI +\uE002→\u0A02; +\uE003→; # FALLBACK BLOW AWAY SIGN VISARGA +\uE004→ਅ; # FALLBACK TO LETTER A +\uE005→ਅ; # LETTER A +\uE006→ਆ; # LETTER AA +\uE007→ਇ; # LETTER I +\uE008→ਈ; # LETTER II +\uE009→ਉ; # LETTER U +\uE00A→ਊ; # LETTER UU +\uE00B→ਰਿ; # REMAP (indicExceptions.txt): \u0A0B→ਰਿ = LETTER VOCALIC R→LETTER RA.VOWEL SIGN I +\uE00C→ਲ਼; # FALLBACK +\uE00D→ਏ; # FALLBACK +\uE00E→ਏ; # FALLBACK +\uE00F→ਏ; # LETTER EE +\uE010→ਐ; # LETTER AI +\uE011→ਓ; # FALLBACK +\uE012→ਓ; # FALLBACK +\uE013→ਓ; # LETTER OO +\uE014→ਔ; # LETTER AU +\uE015→ਕ; # LETTER KA +\uE016→ਖ; # LETTER KHA +\uE017→ਗ; # LETTER GA +\uE018→ਘ; # LETTER GHA +\uE019→ਙ; # LETTER NGA +\uE01A→ਚ; # LETTER CA +\uE01B→ਛ; # LETTER CHA +\uE01C→ਜ; # LETTER JA +\uE01D→ਝ; # LETTER JHA +\uE01E→ਞ; # LETTER NYA +\uE01F→ਟ; # LETTER TTA +\uE020→ਠ; # LETTER TTHA +\uE021→ਡ; # LETTER DDA +\uE022→ਢ; # LETTER DDHA +\uE023→ਣ; # LETTER NNA +\uE024→ਤ; # LETTER TA +\uE025→ਥ; # LETTER THA +\uE026→ਦ; # LETTER DA +\uE027→ਧ; # LETTER DHA +\uE028→ਨ; # LETTER NA +\uE029→ਨ\u0A3C; # REMAP (indicExceptions.txt): \u0A29→ਨ = LETTER NNNA→LETTER NA +\uE02A→ਪ; # LETTER PA +\uE02B→ਫ; # LETTER PHA +\uE02C→ਬ; # LETTER BA +\uE02D→ਭ; # LETTER BHA +\uE02E→ਮ; # LETTER MA +\uE02F→ਯ; # LETTER YA +\uE030→ਰ; # LETTER RA +\uE031→ਰ\u0A3C; # FALLBACK LETTER RA+NUKTA +\uE032→ਲ; # LETTER LA +\uE033→ਲ; # LETTER LLA +\uE034→ਲ਼; # REMAP (indicExceptions.txt): \u0A34→ਲ਼ = LETTER LLLA→LETTER LLA +\uE035→ਵ; # LETTER VA +\uE036→ਸ਼; # LETTER SHA +\uE037→ਸ਼; # REMAP (indicExceptions.txt): \u0A37→ਸ਼ = LETTER SSA→LETTER SHA +\uE038→ਸ; # LETTER SA +\uE039→ਹ; # LETTER HA +\uE03C→\u0A3C; # SIGN NUKTA +\uE03D→; # FALLBACK BLOW AWAY SIGN AVAGRAHA +\uE03E→ਾ; # VOWEL SIGN AA +\uE03F→ਿ; # VOWEL SIGN I +\uE040→ੀ; # VOWEL SIGN II +\uE041→\u0A41; # VOWEL SIGN U +\uE042→\u0A42; # VOWEL SIGN UU +\uE043→; # FALLBACK BLOW AWAY 
VOWEL SIGN VOCALIC R +\uE044→; # FALLBACK BLOW AWAY VOWEL SIGN VOCALIC RR +\uE045→\u0A48; # REMAP (indicExceptions.txt): \u0A45→\u0A48 = VOWEL SIGN CANDRA E→VOWEL SIGN AI +\uE046→\u0A47; # FALLBACK +\uE047→\u0A47; # VOWEL SIGN EE +\uE048→\u0A48; # VOWEL SIGN AI +\uE049→\u0A4C; # REMAP (indicExceptions.txt): \u0A49→\u0A4C = VOWEL SIGN CANDRA O→VOWEL SIGN AU +\uE04A→\u0A4B; # FALLBACK +\uE04B→\u0A4B; # VOWEL SIGN OO +\uE04C→\u0A4C; # VOWEL SIGN AU +\uE04D→\u0A4D; # SIGN VIRAMA +\uE050→ਏ\u0A02; # FALLBACK to OO+BINDI : OM +\uE051→; +\uE052→; +\uE053→; +\uE054→; +\uE055→; # FALLBACK BLOW AWAY LENGTH MARK +\uE056→\u0A48; # REMAP (indicExceptions.txt): \u0A56→\u0A48 = AI LENGTH MARK→VOWEL SIGN AI +\uE057→\u0A4C; # REMAP (indicExceptions.txt): \u0A57→\u0A4C = AU LENGTH MARK→VOWEL SIGN AU +\uE058→ਕ\u0A3C; # FALLBACK KA+NUKTA +\uE059→ਖ਼; # LETTER KHHA +\uE05A→ਗ਼; # LETTER GHHA +\uE05B→ਜ਼; # LETTER ZA +\uE05C→ੜ; # LETTER RRA +\uE05D→ਢ\u0A3C; # REMAP (indicExceptions.txt): \u0A5D→ਢ\u0A3C = LETTER RHA→LETTER DDHA.SIGN NUKTA +\uE05E→ਫ਼; # LETTER FA +\uE05F→ਯ\u0A3C; # REMAP (indicExceptions.txt): \u0A5F→ਯ\u0A3C = LETTER YYA→LETTER YA.SIGN NUKTA +\uE060→ਰਿ; # REMAP (indicExceptions.txt): \u0A60→ਰਿ = LETTER VOCALIC RR→LETTER RA.VOWEL SIGN I +\uE061→ਲ\u0A3C; # +\uE062→ਿ\u0A3C; # REMAP (indicExceptions.txt): \u0A62→ਿ\u0A3C = VOWEL SIGN VOCALIC L→VOWEL SIGN I.SIGN NUKTA +\uE063→ੀ\u0A3C; # REMAP (indicExceptions.txt): \u0A63→ੀ\u0A3C = VOWEL SIGN VOCALIC LL→VOWEL SIGN II.SIGN NUKTA +\uE064→।; # DANDA +\uE065→॥; # DOUBLE DANDA +\uE066→੦; # DIGIT ZERO +\uE067→੧; # DIGIT ONE +\uE068→੨; # DIGIT TWO +\uE069→੩; # DIGIT THREE +\uE06A→੪; # DIGIT FOUR +\uE06B→੫; # DIGIT FIVE +\uE06C→੬; # DIGIT SIX +\uE06D→੭; # DIGIT SEVEN +\uE06E→੮; # DIGIT EIGHT +\uE06F→੯; # DIGIT NINE +\uE070→; # ABBREVIATION SIGN +\uE071→ਰ; # LETTER RA WITH MIDDLE DIAGONAL +\uE072→ਰ; # LETTER RA WITH LOWER DIAGONAL +\uE073→; # RUPEE MARK +\uE074→; # RUPEE SIGN +\uE075→; # CURRENCY NUMERATOR ONE +\uE076→; # CURRENCY NUMERATOR TWO +\uE077→; # 
CURRENCY NUMERATOR THREE +\uE078→; # CURRENCY NUMERATOR FOUR +\uE079→; # CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR +\uE07A→; # CURRENCY DENOMINATOR SIXTEEN +\uE07B→; # ISSHAR +\uE07C→\u0A70; # TIPPI +\uE07D→\u0A71; # ADDAK +\uE07E→ੲ; # IRI +\uE07F→ੳ; # URA +\uE080→ੴ; # EK ONKAR +\uE081→ਵ; # FALLBACK FOR ORIYA LETTER WA +\uE082→; # Devanagari Glottal Stop +\uE083→ਤ\u0A4D; # Bengali Khanda-ta +0 → ੦; # FALLBACK FOR TAMIL +1 → ੧; # :: NFC (NFD) ; # eof +