ar_ar_Latn_BGN.txt (7816B)
# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html
# Generated using tools/cldr/cldr-to-icu/
#
# File: ar_ar_Latn_BGN.txt
# Generated from CLDR
#

#
########################################################################
# BGN/PCGN 1956 System
#
# The BGN adopted this system in 1946 and the PCGN in 1956. It has
# been applied in the systematic romanization of geographic names in
# Bahrain, Egypt, Iraq, Jordan, Kuwait, Lebanon, Libya, Oman, Qatar,
# Saudi Arabia, Sudan, Syria, Tunisia, the United Arab Emirates, and
# Yemen, all of which have been covered by published BGN gazetteers.
#
# Originally prepared by Michael Everson <everson@evertype.com>
########################################################################
#
# MINIMAL FILTER: Arabic-Latin
#
# Only characters matched by this filter are handed to the rules below;
# the input is decomposed (NFKD) before any rule is tried.
#
:: [[:Arabic:][:Block=Arabic:][ءآابةتثجحخدذرزسشصضطظعغفقكلمنهوىي\u064B\u064C\u064D\u064E\u064F\u0650\u0651\u0652٠١٢٣٤٥٦٧٨٩ٱ]] ;
:: NFKD (NFC) ;
#
#
########################################################################
#
########################################################################
#
# Define All Transformation Variables
#
#   $alef      Latin output used for hamza and alef wasla.
#   $ayin      Latin output used for ain.
#   $disambig  U+0331, appended to the Latin side of two-way rules whose
#              plain Latin output is already claimed by another rule
#              (e.g. the extended digits vs. the Arabic-Indic digits).
#
########################################################################
#
$alef     = ’;
$ayin     = ‘;
$disambig = \u0331 ;
#
#
# Use this $wordBoundary until bug 2034 is fixed in ICU:
# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
#
# It matches any single character that is not a letter, mark, or number.
#
$wordBoundary = [^[:L:][:M:][:N:]] ;
#
#
########################################################################
# non-letters
#
# Separators between two digits map to plain ',' / '.'; anywhere else
# they carry $disambig so the two cases stay distinguishable.
#
[:Nd:]{٫}[:Nd:] ↔ [:Nd:]{','}[:Nd:] ;   # ARABIC DECIMAL SEPARATOR
[:Nd:]{٬}[:Nd:] ↔ [:Nd:]{'.'}[:Nd:] ;   # ARABIC THOUSANDS SEPARATOR
٫ ↔ ',' $disambig ;                     # ARABIC DECIMAL SEPARATOR
٬ ↔ '.' $disambig ;                     # ARABIC THOUSANDS SEPARATOR
# ٭ ↔ ; # ARABIC FIVE POINTED STAR // no need to transliterate
، ↔ ',' ;                               # ARABIC COMMA
؛ ↔ ';' ;                               # ARABIC SEMICOLON
؟ ↔ '?' ;                               # ARABIC QUESTION MARK
٪ ↔ '%' ;                               # ARABIC PERCENT SIGN
#
# Extended Arabic-Indic digits (marked with $disambig on the Latin side)
#
۰ ↔ 0 $disambig ;                       # EXTENDED ARABIC-INDIC DIGIT ZERO
۱ ↔ 1 $disambig ;                       # EXTENDED ARABIC-INDIC DIGIT ONE
۲ ↔ 2 $disambig ;                       # EXTENDED ARABIC-INDIC DIGIT TWO
۳ ↔ 3 $disambig ;                       # EXTENDED ARABIC-INDIC DIGIT THREE
۴ ↔ 4 $disambig ;                       # EXTENDED ARABIC-INDIC DIGIT FOUR
۵ ↔ 5 $disambig ;                       # EXTENDED ARABIC-INDIC DIGIT FIVE
۶ ↔ 6 $disambig ;                       # EXTENDED ARABIC-INDIC DIGIT SIX
۷ ↔ 7 $disambig ;                       # EXTENDED ARABIC-INDIC DIGIT SEVEN
۸ ↔ 8 $disambig ;                       # EXTENDED ARABIC-INDIC DIGIT EIGHT
۹ ↔ 9 $disambig ;                       # EXTENDED ARABIC-INDIC DIGIT NINE
#
# Arabic-Indic digits
#
٠ ↔ 0 ;                                 # ARABIC-INDIC DIGIT ZERO
١ ↔ 1 ;                                 # ARABIC-INDIC DIGIT ONE
٢ ↔ 2 ;                                 # ARABIC-INDIC DIGIT TWO
٣ ↔ 3 ;                                 # ARABIC-INDIC DIGIT THREE
٤ ↔ 4 ;                                 # ARABIC-INDIC DIGIT FOUR
٥ ↔ 5 ;                                 # ARABIC-INDIC DIGIT FIVE
٦ ↔ 6 ;                                 # ARABIC-INDIC DIGIT SIX
٧ ↔ 7 ;                                 # ARABIC-INDIC DIGIT SEVEN
٨ ↔ 8 ;                                 # ARABIC-INDIC DIGIT EIGHT
٩ ↔ 9 ;                                 # ARABIC-INDIC DIGIT NINE
#
########################################################################
#
# Rules moved to front to avoid masking
#
########################################################################
#
########################################################################
#
# BGN Page 8 Rule 5
#
# The character sequences ته , كه , ده , and سه may be romanized t·h, k·h,
# d·h, and s·h in order to differentiate those romanizations from the
# digraphs th, kh, dh, and sh.
#
########################################################################
#
# Consonant + HEH pairs get a middle dot between the two Latin letters.
# These rules sit ahead of the single-letter rules so that the
# two-character sequence is matched first.
#
ته → t·h ; # ARABIC LETTER TEH + HEH
كه → k·h ; # ARABIC LETTER KAF + HEH
ده → d·h ; # ARABIC LETTER DAL + HEH
سه → s·h ; # ARABIC LETTER SEEN + HEH
#
#
########################################################################
#
# End Rule 5
#
########################################################################
########################################################################
#
#
# BGN Page 8 Rule 9
#
# Doubled consonant sounds are represented in Arabic script by placing
# a shaddah ( \u0651 ) over a consonant character. In romanization the letter
# should be doubled. [The remainder of this rule deals with the definite
# article and is lexical.]
#
# Each doubled output repeats exactly the romanization that the
# single-letter rule for the same consonant produces later in this file.
# HAH, SAD, DAD, TAH and ZAH therefore use the cedilla forms
# (ḩ ş ḑ ţ z\u0327), not dot-below letters.
#
########################################################################
#
ب\u0651 → bb ; # ARABIC LETTER BEH + SHADDA
ت\u0651 → tt ; # ARABIC LETTER TEH + SHADDA
ث\u0651 → thth ; # ARABIC LETTER THEH + SHADDA
ج\u0651 → jj ; # ARABIC LETTER JEEM + SHADDA
ح\u0651 → ḩḩ ; # ARABIC LETTER HAH + SHADDA
خ\u0651 → khkh ; # ARABIC LETTER KHAH + SHADDA
د\u0651 → dd ; # ARABIC LETTER DAL + SHADDA
ذ\u0651 → dhdh ; # ARABIC LETTER THAL + SHADDA
ر\u0651 → rr ; # ARABIC LETTER REH + SHADDA
ز\u0651 → zz ; # ARABIC LETTER ZAIN + SHADDA
س\u0651 → ss ; # ARABIC LETTER SEEN + SHADDA
ش\u0651 → shsh ; # ARABIC LETTER SHEEN + SHADDA
ص\u0651 → şş ; # ARABIC LETTER SAD + SHADDA
ض\u0651 → ḑḑ ; # ARABIC LETTER DAD + SHADDA
ط\u0651 → ţţ ; # ARABIC LETTER TAH + SHADDA
ظ\u0651 → z\u0327z\u0327 ; # ARABIC LETTER ZAH + SHADDA
ع\u0651 → $ayin $ayin ; # ARABIC LETTER AIN + SHADDA
غ\u0651 → ghgh ; # ARABIC LETTER GHAIN + SHADDA
ف\u0651 → ff ; # ARABIC LETTER FEH + SHADDA
ق\u0651 → qq ; # ARABIC LETTER QAF + SHADDA
ك\u0651 → kk ; # ARABIC LETTER KAF + SHADDA
ل\u0651 → ll ; # ARABIC LETTER LAM + SHADDA
م\u0651 → mm ; # ARABIC LETTER MEEM + SHADDA
ن\u0651 → nn ; # ARABIC LETTER NOON + SHADDA
ه\u0651 → hh ; # ARABIC LETTER HEH + SHADDA
و\u0651 → ww ; # ARABIC LETTER WAW + SHADDA
ي\u0651 → yy ; # ARABIC LETTER YEH + SHADDA
# U+0649 was the only character covered by the "YEH + SHADDA" rule
# before; it is kept so that existing output does not change.
ى\u0651 → yy ; # ARABIC LETTER ALEF MAKSURA + SHADDA
#
#
########################################################################
#
# End Rule 9
#
########################################################################
#
########################################################################
#
# Start of Transformations
#
# A rule of the form  $wordBoundary{X → ...  applies to X only when the
# character before it matches $wordBoundary (not a letter, mark, or
# number). The context-free rule for the same letter follows it and
# handles every other position.
#
########################################################################
#
$wordBoundary{ء → ; # ARABIC LETTER HAMZA
ء → $alef ; # ARABIC LETTER HAMZA
$wordBoundary{ا → ; # ARABIC LETTER ALEF
ٱ → $alef ; # ARABIC LETTER ALEF WASLA
$wordBoundary{آ → ā ; # ARABIC LETTER ALEF WITH MADDA ABOVE
آ → $alef ā ; # ARABIC LETTER ALEF WITH MADDA ABOVE
ب → b ; # ARABIC LETTER BEH
ت → t ; # ARABIC LETTER TEH
ة → h ; # ARABIC LETTER TEH MARBUTA
ث → th ; # ARABIC LETTER THEH
ج → j ; # ARABIC LETTER JEEM
ح → ḩ ; # ARABIC LETTER HAH
خ → kh ; # ARABIC LETTER KHAH
د → d ; # ARABIC LETTER DAL
ذ → dh ; # ARABIC LETTER THAL
ر → r ; # ARABIC LETTER REH
ز → z ; # ARABIC LETTER ZAIN
س → s ; # ARABIC LETTER SEEN
ش → sh ; # ARABIC LETTER SHEEN
ص → ş ; # ARABIC LETTER SAD
ض → ḑ ; # ARABIC LETTER DAD
ط → ţ ; # ARABIC LETTER TAH
ظ → z\u0327 ; # ARABIC LETTER ZAH
ع → $ayin ; # ARABIC LETTER AIN
غ → gh ; # ARABIC LETTER GHAIN
ف → f ; # ARABIC LETTER FEH
ق → q ; # ARABIC LETTER QAF
# KEHEH and KAF are two-way rules; KEHEH carries $disambig on the Latin
# side so the two letters stay distinct.
ک ↔ k $disambig ; # ARABIC LETTER KEHEH
ك ↔ k ; # ARABIC LETTER KAF
ل → l ; # ARABIC LETTER LAM
م → m ; # ARABIC LETTER MEEM
ن → n ; # ARABIC LETTER NOON
ه → h ; # ARABIC LETTER HEH
و → w ; # ARABIC LETTER WAW
# U+064A YEH previously had no standalone rule: the rule labelled YEH was
# keyed on U+0649 ALEF MAKSURA, so a YEH not preceded by fatha or kasra
# was left in Arabic script. Both characters are now covered; the U+0649
# rule is retained so existing output does not change.
ي → y ; # ARABIC LETTER YEH
ى → y ; # ARABIC LETTER ALEF MAKSURA (not preceded by FATHA)
#
# Vowel marks. Each multi-character sequence is listed before the rule
# for the bare mark it starts with, so the longer match is tried first.
#
\u064Eا → ā ; # ARABIC FATHA + ALEF
\u064Eى → á ; # ARABIC FATHA + ALEF MAKSURA
\u064Eي\u0652 → ay ; # ARABIC FATHA + YEH + SUKUN
\u064Eو\u0652 → aw ; # ARABIC FATHA + WAW + SUKUN
\u064E → a ; # ARABIC FATHA
\u0650ي → ī ; # ARABIC KASRA + YEH
\u0650 → i ; # ARABIC KASRA
\u064Fو → ū ; # ARABIC DAMMA + WAW
\u064F → u ; # ARABIC DAMMA
\u0652 → ; # ARABIC SUKUN
\u064B → aⁿ ; # ARABIC FATHATAN
\u064D → iⁿ ; # ARABIC KASRATAN
\u064C → uⁿ ; # ARABIC DAMMATAN
# Recompose the Latin output.
::NFC (NFD) ;
#
#
########################################################################