| # © 2016 and later: Unicode, Inc. and others. |
| # License & terms of use: http://www.unicode.org/copyright.html |
| # Generated using tools/cldr/cldr-to-icu/build-icu-data.xml |
| # |
| # File: InterIndic_Arabic.txt |
| # Generated from CLDR |
| # |
| |
| # $nonword: any character outside U+E000..U+E0FF, the range that every rule source below is written in. |
| # It is used as a trailing context (} $nonword) so that a rule applies only when no further |
| # character from that range follows the match. |
| $nonword = [^\uE000-\uE0FF]; |
| # $wordBoundary: any character that is not a letter, a mark or a number. |
| # It is used as the leading context of the word-initial \uE00F rule. |
| $wordBoundary = [^[:L:][:M:][:N:]]; |
| # Multi-character sequences with a fixed Arabic spelling. |
| # Rules are tried in order, so these must stay above the single-character rules for the same |
| # code points; otherwise the per-character rules would spell the sequence letter by letter |
| # (for example \uE039\uE048 would come out as ه + ا ي instead of هي). |
| # The text after } is trailing context: it must follow the match but is not replaced. |
| \uE015\uE03F\uE02F\uE03E } $nonword→كيا; # किया |
| \uE026\uE03F\uE02F\uE03E } $nonword→ديا; # दिया |
| \uE015\uE03F } $nonword→كي; # कि at word end |
| \uE039\uE048→هي; # ह\u0948 |
| # Chandrabindu, anusvara and visarga. |
| # The at-end and not-at-end variants of chandrabindu and anusvara currently emit the same letter; |
| # they are kept as separate rules so the two positions can be mapped differently if needed. |
| \uE001 } $nonword→ن; # chandrabindu at end to noon |
| \uE001→ن; # chandrabindu not at end to noon |
| \uE002 } $nonword→ن; # anusvara to noon at end |
| \uE002→ن; # anusvara to noon \u0902 |
| \uE003→ه ا; # visarga to ha + alif ः |
| # Independent vowels. |
| # Whitespace inside a replacement is not significant: ا ي emits the two letters back to back. |
| \uE004→ا; # short a to alif ऄ |
| \uE005→ا; # अ |
| \uE006→ا \u0653; # alif followed by combining madda (U+0653) आ |
| # In the context rules below the braces delimit the text that is replaced; the set in front of |
| # them is leading context that must precede the match. Each context rule is followed by an |
| # unconditional fallback for every other position, so the order of each pair matters. |
| [[:L:][:M:]] {\uE007}→ي; # इ after another letter or mark |
| \uE007→إ; # इ at beginning of word |
| [[:L:][:M:]] {\uE008}→ي; # ई after another letter or mark |
| \uE008→إ; # ई at beginning of word |
| \uE009→و; # उ |
| \uE00A→و; # ऊ |
| \uE00B→ر; # ऋ |
| \uE00C→ل; # ऌ |
| \uE00D→ا ي; # ऍ |
| \uE00E→ي; # ऎ |
| $wordBoundary {\uE00F} → إي; # word-initial ए |
| # The at-end and not-at-end variants of the next two vowels currently emit identical output. |
| \uE00F } $nonword→ي; # ए use ي when at end |
| \uE00F→ي; # ए use ي when not at end |
| \uE010 } $nonword→ا ي; # ऐ use ي when at end |
| \uE010→ا ي; # ऐ use ي when not at end |
| \uE011→ا و; # ऑ |
| \uE012→ا و; # ऒ |
| \uE013→ا و; # ओ |
| \uE014→ا و; # औ |
| # Consonants: context-free, one source character per rule. |
| # Aspirated consonants are written as the base letter followed by ه. |
| \uE015 → ك;    # क |
| \uE016 → كه;   # ख |
| \uE017 → ج;    # ग |
| \uE018 → جه;   # घ |
| \uE019 → نج;   # ङ |
| \uE01A → تش;   # च |
| \uE01B → تشه;  # छ |
| \uE01C → ج;    # ज |
| \uE01D → جه;   # झ |
| \uE01E → ن;    # ञ |
| \uE01F → ط;    # ट |
| \uE020 → طه;   # ठ |
| \uE021 → د;    # ड |
| \uE022 → ده;   # ढ |
| \uE023 → ن;    # ण |
| \uE024 → ت;    # त |
| \uE025 → ته;   # थ |
| \uE026 → د;    # द |
| \uE027 → ده;   # ध |
| \uE028 → ن;    # न |
| \uE029 → ن;    # ऩ |
| \uE02A → ب;    # प |
| \uE02B → به;   # फ |
| \uE02C → ب;    # ब |
| \uE02D → به;   # भ |
| \uE02E → م;    # म |
| \uE02F → ي;    # य |
| \uE030 → ر;    # र |
| \uE031 → ر;    # ऱ |
| \uE032 → ل;    # ल |
| \uE033 → ر;    # ळ |
| \uE034 → ر;    # ऴ |
| \uE035 → و;    # व |
| \uE036 → ش;    # श |
| \uE037 → ش;    # ष |
| \uE038 → س;    # स |
| \uE039 → ه;    # ह |
| # Dependent vowel signs and other marks. |
| # A rule with an empty right-hand side deletes the matched character. |
| \uE03C→; # \u093C |
| \uE03D→; # ऽ |
| \uE03E→ا; # ा |
| \uE03F→ي; # ि |
| \uE040→ي; # ी |
| \uE041→و; # \u0941 |
| \uE042→و; # \u0942 |
| \uE043→ر; # \u0943 |
| \uE044→ر; # \u0944 |
| # NOTE(review): this sign maps to noon, whereas \uE00D (presumably its independent-vowel |
| # counterpart) maps to ا ي. Confirm that noon is intended here. |
| \uE045→ن; # \u0945 |
| \uE046→ي; # \u0946 |
| # The at-end and not-at-end variants of the next two signs currently emit identical output. |
| \uE047 } $nonword→ي; # \u0947 use ي when at end |
| \uE047→ي; # \u0947 use ي when not at end |
| \uE048 } $nonword→ا ي; # \u0948 use ي when at end |
| \uE048→ا ي; # \u0948 use ي when not at end |
| \uE049→و; # ॉ |
| \uE04A→ا و; # ॊ |
| \uE04B→و; # ो |
| \uE04C→ا و; # ौ |
| \uE04D→; # \u094D |
| \uE050→ا و; # ॐ |
| \uE051→; # \u0951 |
| \uE052→; # \u0952 |
| \uE053→; # \u0953 |
| \uE054→; # \u0954 |
| # Nukta consonants and the remaining vocalic letters and signs: context-free, one rule each. |
| \uE058 → ق;   # क़ |
| \uE059 → خ;   # ख़ |
| \uE05A → غ;   # ग़ |
| \uE05B → ز;   # ज़ |
| \uE05C → ر;   # ड़ |
| \uE05D → ره;  # ढ़ |
| \uE05E → ف;   # फ़ |
| \uE05F → ي;   # य़ |
| \uE060 → ر;   # ॠ |
| \uE061 → ل;   # ॡ |
| \uE062 → ل;   # \u0962 |
| \uE063 → ل;   # \u0963 |
| # Punctuation: both danda forms become the Arabic full stop ۔. |
| \uE064→۔; # । |
| \uE065→۔; # ॥ |
| # Digits map one-to-one onto the Arabic-Indic digits U+0660..U+0669. |
| # Zero is written as an escape because U+0660 is easily mistaken for a full stop; the rule |
| # previously emitted a literal full stop, which turned numbers such as १० into a digit |
| # followed by punctuation. |
| \uE066→\u0660; # ० ARABIC-INDIC DIGIT ZERO |
| \uE067→١; # १ |
| \uE068→٢; # २ |
| \uE069→٣; # ३ |
| \uE06A→٤; # ४ |
| \uE06B→٥; # ५ |
| \uE06C→٦; # ६ |
| \uE06D→٧; # ७ |
| \uE06E→٨; # ८ |
| \uE06F→٩; # ९ |
| # The abbreviation sign becomes a full stop; the backslash escapes the dot so it is taken literally. |
| \uE070→\.; # ॰ |
| # Empty right-hand side: the character is deleted. |
| \uE082→; # ॽ |
| # Second pass: collapse runs of alif. |
| # ::null ends the first pass, so the rules below see the Arabic output of the rules above. |
| # An alif unit is one alif letter (plain, hamza above, hamza below or madda) plus any marks |
| # attached to it. Two or more consecutive units are reduced to the first one, |
| # e.g. पाओला → بااولا → باولا. |
| ::null; |
| $alifUnit = [أإآا] [:M:]*; |
| ($alifUnit) $alifUnit+ → $1; |
| |