fa_fa_Latn_BGN.txt (7684B)
# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html
# Generated using tools/cldr/cldr-to-icu/
#
# File: fa_fa_Latn_BGN.txt
# Generated from CLDR
#

#
########################################################################
# BGN/PCGN 1958 System -- romanization of Persian
#
# Adopted by the BGN in 1946 and by the PCGN in 1958. Used to romanize
# geographic names in Iran and Persian-language names in Afghanistan.
#
# Originally prepared by Michael Everson <everson@evertype.com>
########################################################################
#
# MINIMAL FILTER: Persian-Latin
#
# Only characters in this set are handed to the rules below; the input is
# then fully decomposed (NFKD) before any rule is tried. In the reverse
# direction the text is composed (NFC) instead.
#
:: [[:Arabic:][:Block=Arabic:][ءآابةتثجحخدذرزسشصضطظعغفقكلمنهویي\u064E\u064F\u0650\u0651\u0652٠١٢٣٤٥٦٧٨٩پچژگی]] ;
:: NFKD (NFC) ;
#
#
########################################################################
#
########################################################################
#
# Transformation variables
#
########################################################################
#
# Latin stand-ins for hamza/alef and for ain.
$alef     = ’;
$ayin     = ‘;
# Combining mark (U+0331) appended to the Latin side of a rule whenever
# two different Arabic-script characters share the same Latin output, so
# that the reverse transform can tell them apart.
$disambig = \u0331 ;
#
#
# Hand-rolled word boundary (anything that is not a letter, mark or
# number). Use this $wordBoundary until bug 2034 is fixed in ICU:
# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
#
$wordBoundary = [^[:L:][:M:][:N:]] ;
#
#
########################################################################
# Non-letters: punctuation and digits
#
# Separators standing between two digits map to the plain Latin separator;
# these contextual rules must stay ahead of the bare-separator rules.
[:Nd:]{٫}[:Nd:] ↔ [:Nd:]{','}[:Nd:] ;   # decimal separator between digits
[:Nd:]{٬}[:Nd:] ↔ [:Nd:]{'.'}[:Nd:] ;   # thousands separator between digits
٫ ↔ ',' $disambig ;                     # ARABIC DECIMAL SEPARATOR (elsewhere)
٬ ↔ '.' $disambig ;                     # ARABIC THOUSANDS SEPARATOR (elsewhere)
# ٭ ↔ ; # ARABIC FIVE POINTED STAR // no need to transliterate
، ↔ ',' ;                               # ARABIC COMMA
؛ ↔ ';' ;                               # ARABIC SEMICOLON
؟ ↔ '?' ;                               # ARABIC QUESTION MARK
٪ ↔ '%' ;                               # ARABIC PERCENT SIGN
#
# Arabic-Indic digits: tagged with $disambig so that, in reverse, a bare
# Latin digit maps to the extended (Persian) digit instead.
٠ ↔ 0 $disambig ;                       # ARABIC-INDIC DIGIT ZERO
١ ↔ 1 $disambig ;                       # ARABIC-INDIC DIGIT ONE
٢ ↔ 2 $disambig ;                       # ARABIC-INDIC DIGIT TWO
٣ ↔ 3 $disambig ;                       # ARABIC-INDIC DIGIT THREE
٤ ↔ 4 $disambig ;                       # ARABIC-INDIC DIGIT FOUR
٥ ↔ 5 $disambig ;                       # ARABIC-INDIC DIGIT FIVE
٦ ↔ 6 $disambig ;                       # ARABIC-INDIC DIGIT SIX
٧ ↔ 7 $disambig ;                       # ARABIC-INDIC DIGIT SEVEN
٨ ↔ 8 $disambig ;                       # ARABIC-INDIC DIGIT EIGHT
٩ ↔ 9 $disambig ;                       # ARABIC-INDIC DIGIT NINE
#
# Extended Arabic-Indic digits: the untagged Latin digit round-trips here.
۰ ↔ 0 ;                                 # EXTENDED ARABIC-INDIC DIGIT ZERO
۱ ↔ 1 ;                                 # EXTENDED ARABIC-INDIC DIGIT ONE
۲ ↔ 2 ;                                 # EXTENDED ARABIC-INDIC DIGIT TWO
۳ ↔ 3 ;                                 # EXTENDED ARABIC-INDIC DIGIT THREE
۴ ↔ 4 ;                                 # EXTENDED ARABIC-INDIC DIGIT FOUR
۵ ↔ 5 ;                                 # EXTENDED ARABIC-INDIC DIGIT FIVE
۶ ↔ 6 ;                                 # EXTENDED ARABIC-INDIC DIGIT SIX
۷ ↔ 7 ;                                 # EXTENDED ARABIC-INDIC DIGIT SEVEN
۸ ↔ 8 ;                                 # EXTENDED ARABIC-INDIC DIGIT EIGHT
۹ ↔ 9 ;                                 # EXTENDED ARABIC-INDIC DIGIT NINE
#
########################################################################
#
# Rules moved to front to avoid masking
#
########################################################################
#
########################################################################
#
# BGN Page 89 Rule 4
#
# The character sequences كه , زه , سه , and گه may be romanized k·h, z·h,
# s·h, and g·h in order to differentiate those romanizations from the
# digraphs kh, zh, sh, and gh.
#
########################################################################
#
# Consonant + HEH sequences get a middle dot so that they cannot be read
# as the digraphs kh, zh, sh, gh. These rules sit ahead of the
# single-letter rules, which would otherwise consume the first letter.
# Both kaf shapes are covered: ARABIC KAF and KEHEH, the latter being the
# letter this file maps to plain "k".
#
كه → k·h ; # ARABIC LETTER KAF + HEH
که → k·h ; # ARABIC LETTER KEHEH + HEH
زه → z·h ; # ARABIC LETTER ZAIN + HEH
سه → s·h ; # ARABIC LETTER SEEN + HEH
گه → g·h ; # ARABIC LETTER GAF + HEH
#
#
########################################################################
#
# End Rule 4
#
########################################################################
#
########################################################################
#
# BGN Page 91 Rule 7
#
# Doubled consonant sounds are represented in Arabic script by
# placing a shaddah ( \u0651 ) over a consonant character. In romanization
# the letter should be doubled. [The remainder of this rule deals with
# the definite article and is lexical.]
#
# Each doubled form below is exactly twice the single-letter romanization
# given in the main table further down; keep the two tables in step.
#
# NOTE(review): the input has been through NFKD, whose canonical
# reordering places FATHA/DAMMA/KASRA before SHADDA. A consonant that
# carries both a short vowel mark and a shaddah therefore presumably
# does not match these rules -- confirm against ICU behaviour.
#
########################################################################
#
ب\u0651 → bb ; # ARABIC LETTER BEH + SHADDA
پ\u0651 → pp ; # ARABIC LETTER PEH + SHADDA
ت\u0651 → tt ; # ARABIC LETTER TEH + SHADDA
ث\u0651 → s\u0304s\u0304 ; # ARABIC LETTER THEH + SHADDA
ج\u0651 → jj ; # ARABIC LETTER JEEM + SHADDA
چ\u0651 → chch ; # ARABIC LETTER TCHEH + SHADDA
ح\u0651 → ḥḥ ; # ARABIC LETTER HAH + SHADDA
خ\u0651 → khkh ; # ARABIC LETTER KHAH + SHADDA
د\u0651 → dd ; # ARABIC LETTER DAL + SHADDA
ذ\u0651 → z\u0304z\u0304 ; # ARABIC LETTER THAL + SHADDA
ر\u0651 → rr ; # ARABIC LETTER REH + SHADDA
ز\u0651 → zz ; # ARABIC LETTER ZAIN + SHADDA
ژ\u0651 → zhzh ; # ARABIC LETTER JEH + SHADDA
س\u0651 → ss ; # ARABIC LETTER SEEN + SHADDA
ش\u0651 → shsh ; # ARABIC LETTER SHEEN + SHADDA
ص\u0651 → ṣṣ ; # ARABIC LETTER SAD + SHADDA
ض\u0651 → ẕẕ ; # ARABIC LETTER DAD + SHADDA (single DAD is ẕ, not ḍ)
ط\u0651 → ṭṭ ; # ARABIC LETTER TAH + SHADDA
ظ\u0651 → ẓẓ ; # ARABIC LETTER ZAH + SHADDA
ع\u0651 → $ayin $ayin ; # ARABIC LETTER AIN + SHADDA
غ\u0651 → ghgh ; # ARABIC LETTER GHAIN + SHADDA
ف\u0651 → ff ; # ARABIC LETTER FEH + SHADDA
ق\u0651 → qq ; # ARABIC LETTER QAF + SHADDA
ك\u0651 → kk ; # ARABIC LETTER KAF + SHADDA
ک\u0651 → kk ; # ARABIC LETTER KEHEH + SHADDA
گ\u0651 → gg ; # ARABIC LETTER GAF + SHADDA
ل\u0651 → ll ; # ARABIC LETTER LAM + SHADDA
م\u0651 → mm ; # ARABIC LETTER MEEM + SHADDA
ن\u0651 → nn ; # ARABIC LETTER NOON + SHADDA
ه\u0651 → hh ; # ARABIC LETTER HEH + SHADDA
و\u0651 → vv ; # ARABIC LETTER WAW + SHADDA (single WAW is v, not w)
ی\u0651 → yy ; # ARABIC LETTER FARSI YEH + SHADDA
#
#
########################################################################
#
# End Rule 7
#
########################################################################
#
########################################################################
#
# Start of Transformations
#
########################################################################
#
$wordBoundary{ء → ; # ARABIC LETTER HAMZA (dropped after a word boundary)
ء → $alef ; # ARABIC LETTER HAMZA
# ALEF WITH MADDA ABOVE reaches these rules as ALEF + COMBINING MADDA
# (U+0653) because the input has already been through NFKD. Match that
# decomposed form first, ahead of the word-boundary ALEF rule, which would
# otherwise delete the ALEF and strand the combining mark.
ا\u0653 → $alef ā ; # ARABIC LETTER ALEF + MADDAH ABOVE (decomposed form)
$wordBoundary{ا → ; # ARABIC LETTER ALEF (dropped after a word boundary)
آ → $alef ā ; # ARABIC LETTER ALEF WITH MADDA ABOVE (precomposed form)
ب → b ; # ARABIC LETTER BEH
پ → p ; # ARABIC LETTER PEH
ت → t ; # ARABIC LETTER TEH
ة → h ; # ARABIC LETTER TEH MARBUTA
ث → s\u0304 ; # ARABIC LETTER THEH
ج → j ; # ARABIC LETTER JEEM
چ → ch ; # ARABIC LETTER TCHEH
ح → ḥ ; # ARABIC LETTER HAH
خ → kh ; # ARABIC LETTER KHAH
د → d ; # ARABIC LETTER DAL
ذ → z\u0304 ; # ARABIC LETTER THAL
ر → r ; # ARABIC LETTER REH
ز → z ; # ARABIC LETTER ZAIN
ژ → zh ; # ARABIC LETTER JEH
س → s ; # ARABIC LETTER SEEN
ش → sh ; # ARABIC LETTER SHEEN
ص → ṣ ; # ARABIC LETTER SAD
ض → ẕ ; # ARABIC LETTER DAD
ط → ṭ ; # ARABIC LETTER TAH
ظ → ẓ ; # ARABIC LETTER ZAH
ع → $ayin ; # ARABIC LETTER AIN
غ → gh ; # ARABIC LETTER GHAIN
ف → f ; # ARABIC LETTER FEH
ق → q ; # ARABIC LETTER QAF
# KEHEH owns the bare "k" in the reverse direction; ARABIC KAF is tagged
# with $disambig so the two round-trip distinctly.
ک ↔ k ; # ARABIC LETTER KEHEH
ك ↔ k $disambig ; # ARABIC LETTER KAF
گ → g ; # ARABIC LETTER GAF
ل → l ; # ARABIC LETTER LAM
م → m ; # ARABIC LETTER MEEM
ن → n ; # ARABIC LETTER NOON
ه → h ; # ARABIC LETTER HEH
و → v ; # ARABIC LETTER WAW
ی → y ; # ARABIC LETTER FARSI YEH
# Vowel marks: longer sequences first, so that the bare short-vowel rule
# only fires when no long-vowel or diphthong pattern matched.
\u064Eا → ā ; # ARABIC FATHA + ALEF
\u064Eی → á ; # ARABIC FATHA + FARSI YEH
\u064Eو\u0652 → ow ; # ARABIC FATHA + WAW + SUKUN
\u064E → a ; # ARABIC FATHA
\u0650ي → ī ; # ARABIC KASRA + YEH
\u0650ی → ī ; # ARABIC KASRA + FARSI YEH
\u0650 → e ; # ARABIC KASRA
\u064Fو → ū ; # ARABIC DAMMA + WAW
\u064F → o ; # ARABIC DAMMA
\u0652 → ; # ARABIC SUKUN
::NFC (NFD) ;
#
#
########################################################################