InterIndic_Arabic.txt (3497B)
# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html
# Generated using tools/cldr/cldr-to-icu/
#
# File: InterIndic_Arabic.txt
# Generated from CLDR
#

# ---------------------------------------------------------------------------
# Context sets used by the rules below.
#   $nonword      - any character outside the range U+E000..U+E0FF
#                   (the code points these rules consume).
#   $wordBoundary - any character that is not a letter, mark, or number.
# ---------------------------------------------------------------------------
$nonword = [^\uE000-\uE0FF];
$wordBoundary = [^[:L:][:M:][:N:]];

# ---------------------------------------------------------------------------
# Multi-character special cases. They are listed ahead of the single-character
# rules so that the longer sequences are tried first.
# ---------------------------------------------------------------------------
\uE015\uE03F\uE02F\uE03E } $nonword → كيا;   # किया, only when followed by $nonword
\uE026\uE03F\uE02F\uE03E } $nonword → ديا;   # दिया, only when followed by $nonword
\uE015\uE03F } $nonword → كي;                # कि at the end of a word
\uE039\uE048 → هي;                           # ह\u0948 (ha + vowel sign ai)

# ---------------------------------------------------------------------------
# Nasalization and aspiration signs.
# The "at end" and "not at end" variants currently produce the same output.
# ---------------------------------------------------------------------------
\uE001 } $nonword → ن;   # chandrabindu at end of word -> noon
\uE001 → ن;              # chandrabindu elsewhere -> noon
\uE002 } $nonword → ن;   # anusvara at end of word -> noon
\uE002 → ن;              # anusvara elsewhere -> noon (\u0902)
\uE003 → ه ا;            # visarga -> heh + alif (ः)

# ---------------------------------------------------------------------------
# Independent vowels.
# ---------------------------------------------------------------------------
\uE004 → ا;                      # ऄ short a -> alif
\uE005 → ا;                      # अ
\uE006 → ا \u0653;               # आ -> alif followed by maddah above
[[:L:][:M:]] {\uE007} → ي;       # इ preceded by a letter or mark
\uE007 → إ;                      # इ otherwise (start of word)
[[:L:][:M:]] {\uE008} → ي;       # ई preceded by a letter or mark
\uE008 → إ;                      # ई otherwise (start of word)
\uE009 → و;                      # उ
\uE00A → و;                      # ऊ
\uE00B → ر;                      # ऋ
\uE00C → ل;                      # ऌ
\uE00D → ا ي;                    # ऍ
\uE00E → ي;                      # ऎ
$wordBoundary {\uE00F} → إي;     # ए at the start of a word
\uE00F } $nonword → ي;           # ए at the end of a word
\uE00F → ي;                      # ए elsewhere
\uE010 } $nonword → ا ي;         # ऐ at the end of a word
\uE010 → ا ي;                    # ऐ elsewhere
\uE011 → ا و;                    # ऑ
\uE012 → ا و;                    # ऒ
\uE013 → ا و;                    # ओ
\uE014 → ا و;                    # औ

# ---------------------------------------------------------------------------
# Consonants. Aspirated consonants are written as the base letter plus heh.
# ---------------------------------------------------------------------------
\uE015 → ك;     # क
\uE016 → كه;    # ख
\uE017 → ج;     # ग
\uE018 → جه;    # घ
\uE019 → نج;    # ङ
\uE01A → تش;    # च
\uE01B → تشه;   # छ
\uE01C → ج;     # ज
\uE01D → جه;    # झ
\uE01E → ن;     # ञ
\uE01F → ط;     # ट
\uE020 → طه;    # ठ
\uE021 → د;     # ड
\uE022 → ده;    # ढ
\uE023 → ن;     # ण
\uE024 → ت;     # त
\uE025 → ته;    # थ
\uE026 → د;     # द
\uE027 → ده;    # ध
\uE028 → ن;     # न
\uE029 → ن;     # ऩ
\uE02A → ب;     # प
\uE02B → به;    # फ
\uE02C → ب;     # ब
\uE02D → به;    # भ
\uE02E → م;     # म
\uE02F → ي;     # य
\uE030 → ر;     # र
\uE031 → ر;     # ऱ
\uE032 → ل;     # ल
\uE033 → ر;     # ळ
\uE034 → ر;     # ऴ
\uE035 → و;     # व
\uE036 → ش;     # श
\uE037 → ش;     # ष
# ---------------------------------------------------------------------------
# Remaining consonants.
# ---------------------------------------------------------------------------
\uE038 → س;     # स
\uE039 → ه;     # ह

# ---------------------------------------------------------------------------
# Signs that have no Arabic counterpart here are deleted (empty output).
# ---------------------------------------------------------------------------
\uE03C → ;      # \u093C (nukta)
\uE03D → ;      # ऽ (avagraha)

# ---------------------------------------------------------------------------
# Dependent vowel signs.
# The "at end" and "not at end" variants currently produce the same output.
# ---------------------------------------------------------------------------
\uE03E → ا;                 # ा
\uE03F → ي;                 # ि
\uE040 → ي;                 # ी
\uE041 → و;                 # \u0941
\uE042 → و;                 # \u0942
\uE043 → ر;                 # \u0943
\uE044 → ر;                 # \u0944
\uE045 → ن;                 # \u0945
\uE046 → ي;                 # \u0946
\uE047 } $nonword → ي;      # \u0947 at the end of a word
\uE047 → ي;                 # \u0947 elsewhere
\uE048 } $nonword → ا ي;    # \u0948 at the end of a word
\uE048 → ا ي;               # \u0948 elsewhere
\uE049 → و;                 # ॉ
\uE04A → ا و;               # ॊ
\uE04B → و;                 # ो
\uE04C → ا و;               # ौ
\uE04D → ;                  # \u094D (virama) is dropped
\uE050 → ا و;               # ॐ
\uE051 → ;                  # \u0951 dropped
\uE052 → ;                  # \u0952 dropped
\uE053 → ;                  # \u0953 dropped
\uE054 → ;                  # \u0954 dropped

# ---------------------------------------------------------------------------
# Nukta consonants and additional vocalic letters.
# ---------------------------------------------------------------------------
\uE058 → ق;     # क़
\uE059 → خ;     # ख़
\uE05A → غ;     # ग़
\uE05B → ز;     # ज़
\uE05C → ر;     # ड़
\uE05D → ره;    # ढ़
\uE05E → ف;     # फ़
\uE05F → ي;     # य़
\uE060 → ر;     # ॠ
\uE061 → ل;     # ॡ
\uE062 → ل;     # \u0962
\uE063 → ل;     # \u0963

# ---------------------------------------------------------------------------
# Punctuation.
# ---------------------------------------------------------------------------
\uE064 → ۔;     # । danda -> Arabic full stop (U+06D4)
\uE065 → ۔;     # ॥ double danda -> Arabic full stop (U+06D4)

# ---------------------------------------------------------------------------
# Digits -> Arabic-Indic digits U+0660..U+0669.
# Zero previously mapped to "\." (a full stop), which turned e.g. १० into "١."
# and lost the digit; it now maps to U+0660 like the other nine digits.
# NOTE(review): this file is generated from CLDR - apply the same correction to
# the CLDR transform source so regeneration does not revert it.
# ---------------------------------------------------------------------------
\uE066 → ٠;     # ० -> U+0660 ARABIC-INDIC DIGIT ZERO
\uE067 → ١;     # १
\uE068 → ٢;     # २
\uE069 → ٣;     # ३
\uE06A → ٤;     # ४
\uE06B → ٥;     # ५
\uE06C → ٦;     # ६
\uE06D → ٧;     # ७
\uE06E → ٨;     # ८
\uE06F → ٩;     # ९

# ---------------------------------------------------------------------------
# Miscellaneous signs.
# ---------------------------------------------------------------------------
\uE070 → \.;    # ॰ abbreviation sign -> full stop
\uE082 → ;      # ॽ dropped

# ---------------------------------------------------------------------------
# Remove sequences of alif characters.
# For example, transform पाओला → بااولا → باولا.
# "::null;" ends the rule set above, so the cleanup rule runs as a separate
# pass over the already-converted text.
# $alif is one alif variant followed by any number of combining marks; a run of
# two or more such units is replaced by the first unit only.
# ---------------------------------------------------------------------------
::null;
$alif = [أإآا] [:M:]*;
($alif) $alif+ → $1;