bg_bg_Latn_BGN.txt (8514B)
# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html
# Generated using tools/cldr/cldr-to-icu/
#
# File: bg_bg_Latn_BGN.txt
# Generated from CLDR
#

#
########################################################################
# BGN/PCGN 1952 System
#
# This system was adopted by the BGN in 1949 and by the PCGN in 1952.
# It reflects the much simplified Bulgarian orthography as officially
# revised in February 1945. The Bulgarian alphabet contains all of
# the characters present in the Russian alphabet with the exception
# of Ёё, Ыы, and Ээ. Two obsolete letters Ѫѫ and Ѣѣ are also given.
#
# The Bulgarian Alphabet as defined by the BGN (Page 15):
#
# АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢ
# абвгдежзийклмнопрстуфхцчшщъьюяѫѣ
#
# Originally prepared by Michael Everson <everson@evertype.com>
########################################################################
#
# MINIMAL FILTER: Bulgarian-Latin
#
# Only the letters listed in the filter set are handed to the rules
# below. The forward direction normalizes to NFD; the parenthesized
# NFC is the normalization named for the reverse direction.
#
:: [АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢабвгдежзийклмнопрстуфхцчшщъьюяѫѣ] ;
:: NFD (NFC) ;
#
#
########################################################################
#
########################################################################
#
# Define All Transformation Variables
#
# Letter classes, split by case. $lower is what the digraph rules test
# to choose between title-case output (Zh) and all-caps output (ZH).
#
########################################################################
#
$upperConsonants = [БВГДЖЗЙКЛМНПРСТФХЦЧШЩЬ] ;
$lowerConsonants = [бвгджзйклмнпрстфхцчшщь] ;
$consonants      = [$upperConsonants $lowerConsonants] ;
$upperVowels     = [АЕИОУЪЮЯѪѢ] ;
$lowerVowels     = [аеиоуъюяѫѣ] ;
$vowels          = [$upperVowels $lowerVowels] ;
$lower           = [$lowerConsonants $lowerVowels] ;
$bulgarian       = [ $lower $upperConsonants $upperVowels ] ;
#
#
# Use this $wordBoundary until bug 2034 is fixed in ICU:
# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
#
# Any character that is not a letter, mark or number counts as a boundary.
#
$wordBoundary = [^[:L:][:M:][:N:]] ;
#
#
########################################################################
#
########################################################################
#
# Start of Alphabetic Transformations
#
# Rules are listed in alphabet order. Where a letter has several rules,
# the contextual one is listed before the plain one.
#
########################################################################
#
А → A ;            # CYRILLIC CAPITAL LETTER A
а → a ;            # CYRILLIC SMALL LETTER A
Б → B ;            # CYRILLIC CAPITAL LETTER BE
б → b ;            # CYRILLIC SMALL LETTER BE
В → V ;            # CYRILLIC CAPITAL LETTER VE
в → v ;            # CYRILLIC SMALL LETTER VE
Г → G ;            # CYRILLIC CAPITAL LETTER GHE
г → g ;            # CYRILLIC SMALL LETTER GHE
Д → D ;            # CYRILLIC CAPITAL LETTER DE
д → d ;            # CYRILLIC SMALL LETTER DE
Е → E ;            # CYRILLIC CAPITAL LETTER IE
е → e ;            # CYRILLIC SMALL LETTER IE
# Capital ZHE followed by a lower-case letter gives title-case "Zh";
# any other capital ZHE gives "ZH".
Ж } $lower → Zh ;  # CYRILLIC CAPITAL LETTER ZHE (before lower case)
Ж → ZH ;           # CYRILLIC CAPITAL LETTER ZHE
ж → zh ;           # CYRILLIC SMALL LETTER ZHE
З → Z ;            # CYRILLIC CAPITAL LETTER ZE
з → z ;            # CYRILLIC SMALL LETTER ZE
И → I ;            # CYRILLIC CAPITAL LETTER I
и → i ;            # CYRILLIC SMALL LETTER I
Й → Y ;            # CYRILLIC CAPITAL LETTER SHORT I
й → y ;            # CYRILLIC SMALL LETTER SHORT I
К → K ;            # CYRILLIC CAPITAL LETTER KA
к → k ;            # CYRILLIC SMALL LETTER KA
Л → L ;            # CYRILLIC CAPITAL LETTER EL
л → l ;            # CYRILLIC SMALL LETTER EL
М → M ;            # CYRILLIC CAPITAL LETTER EM
м → m ;            # CYRILLIC SMALL LETTER EM
Н → N ;            # CYRILLIC CAPITAL LETTER EN
н → n ;            # CYRILLIC SMALL LETTER EN
О → O ;            # CYRILLIC CAPITAL LETTER O
о → o ;            # CYRILLIC SMALL LETTER O
П → P ;            # CYRILLIC CAPITAL LETTER PE
п → p ;            # CYRILLIC SMALL LETTER PE
Р → R ;            # CYRILLIC CAPITAL LETTER ER
р → r ;            # CYRILLIC SMALL LETTER ER
С → S ;            # CYRILLIC CAPITAL LETTER ES
с → s ;            # CYRILLIC SMALL LETTER ES
#
#
########################################################################
#
# BGN Page 16 Note 4
#
# тс becomes t·s
#
########################################################################
#
# The two-letter тс rules are listed before the single-letter Т rules so
# that the pair is tried first. The middle dot keeps the result distinct
# from the "ts" produced for ц further down.
#
ТС → T·S ;         # CYRILLIC CAPITAL LETTER TE + CAPITAL LETTER ES
Тс → T·s ;         # CYRILLIC CAPITAL LETTER TE + SMALL LETTER ES
тс → t·s ;         # CYRILLIC SMALL LETTER TE + SMALL LETTER ES
Т → T ;            # CYRILLIC CAPITAL LETTER TE
т → t ;            # CYRILLIC SMALL LETTER TE
#
#
########################################################################
#
# End Note 4
#
########################################################################
У → U ;            # CYRILLIC CAPITAL LETTER U
у → u ;            # CYRILLIC SMALL LETTER U
Ф → F ;            # CYRILLIC CAPITAL LETTER EF
ф → f ;            # CYRILLIC SMALL LETTER EF
# For the capitals below, the rule with "} $lower" yields a title-case
# digraph when a lower-case Bulgarian letter follows; the plain rule
# yields the all-caps digraph.
Х } $lower → Kh ;  # CYRILLIC CAPITAL LETTER HA (before lower case)
Х → KH ;           # CYRILLIC CAPITAL LETTER HA
х → kh ;           # CYRILLIC SMALL LETTER HA
Ц } $lower → Ts ;  # CYRILLIC CAPITAL LETTER TSE (before lower case)
Ц → TS ;           # CYRILLIC CAPITAL LETTER TSE
ц → ts ;           # CYRILLIC SMALL LETTER TSE
Ч } $lower → Ch ;  # CYRILLIC CAPITAL LETTER CHE (before lower case)
Ч → CH ;           # CYRILLIC CAPITAL LETTER CHE
ч → ch ;           # CYRILLIC SMALL LETTER CHE
#
########################################################################
#
# Implied rule from BGN Russian-Latin transliteration (Page 94 Note 3.6).
#
# шт becomes sh·t
#
########################################################################
#
# The two-letter шт rules come before the single-letter Ш rules so the
# pair is tried first. The middle dot keeps the result distinct from the
# "sht" produced for щ.
#
ШТ → SH·T ;        # CYRILLIC CAPITAL LETTER SHA + CAPITAL LETTER TE
Шт → Sh·t ;        # CYRILLIC CAPITAL LETTER SHA + SMALL LETTER TE
шт → sh·t ;        # CYRILLIC SMALL LETTER SHA + SMALL LETTER TE
Ш } $lower → Sh ;  # CYRILLIC CAPITAL LETTER SHA (before lower case)
Ш → SH ;           # CYRILLIC CAPITAL LETTER SHA
ш → sh ;           # CYRILLIC SMALL LETTER SHA
Щ } $lower → Sht ; # CYRILLIC CAPITAL LETTER SHCHA (before lower case)
Щ → SHT ;          # CYRILLIC CAPITAL LETTER SHCHA
щ → sht ;          # CYRILLIC SMALL LETTER SHCHA
#
#
########################################################################
#
# End Implied rule
#
########################################################################
#
########################################################################
#
# BGN Page 16 Note 1
#
# In modern Bulgarian orthography, the character ъ does not occur in
# word-final position. It should be omitted in romanization when found
# in older sources.
#
# The following rule removes all Ъъ at the end of a word. It is assumed
# that when the condition is met, the text must be from an older source.
# Comment out with a '#' at the start of a line to disable.
#
# This rule has to stand BEFORE the plain Ъ/ъ rules: the first rule that
# matches wins, so an unconditional Ъ → Ŭ listed earlier would always
# take the letter and the removal would never happen.
#
# The before-context accepts any letter or mark rather than Cyrillic
# letters only, because the text to the left of the current position has
# already been romanized when this rule is tried.
#
# NOTE(review): $wordBoundary is a character class, so a Ъ/ъ that is the
# very last character of the input (nothing follows it) is presumably
# not removed -- confirm against the ICU end-anchor behavior.
#
########################################################################
#
[[:L:][:M:]] { [Ъъ] } $wordBoundary → ;
#
#
########################################################################
#
# End BGN Page 16 Note 1
#
########################################################################
Ъ → Ŭ ;            # CYRILLIC CAPITAL LETTER HARD SIGN
ъ → ŭ ;            # CYRILLIC SMALL LETTER HARD SIGN
Ь → ’ ;            # CYRILLIC CAPITAL LETTER SOFT SIGN
ь → ’ ;            # CYRILLIC SMALL LETTER SOFT SIGN
Ю } $lower → Yu ;  # CYRILLIC CAPITAL LETTER YU (before lower case)
Ю → YU ;           # CYRILLIC CAPITAL LETTER YU
ю → yu ;           # CYRILLIC SMALL LETTER YU
Я } $lower → Ya ;  # CYRILLIC CAPITAL LETTER YA (before lower case)
Я → YA ;           # CYRILLIC CAPITAL LETTER YA
я → ya ;           # CYRILLIC SMALL LETTER YA
#
########################################################################
#
# BGN Page 16 Note 2
#
# The obsolete character Ѫ, which was replaced by Ъ in 1945, should be
# romanized Ŭ.
#
########################################################################
#
Ѫ → Ŭ ;            # CYRILLIC CAPITAL LETTER BIG YUS
ѫ → ŭ ;            # CYRILLIC SMALL LETTER BIG YUS
#
#
########################################################################
#
# End BGN Page 16 Note 2
#
########################################################################
#
########################################################################
#
# BGN Page 16 Note 3
#
# The obsolete character Ѣ, replaced in 1945 by Я or Е according to local
# pronunciation, should be romanized as e or ya, accordingly, if the
# pronunciation is known; otherwise as ye.
#
########################################################################
#
Ѣ } $lower → Ye ;  # CYRILLIC CAPITAL LETTER YAT (before lower case)
Ѣ → YE ;           # CYRILLIC CAPITAL LETTER YAT
ѣ → ye ;           # CYRILLIC SMALL LETTER YAT
#
#
# Alternative rule where appropriate for local pronunciation. To apply
# uncomment the following by removing the '#' mark at the start of the
# line and insert before the three rule lines above.
#
# Ѣ } $lower → E ; # CYRILLIC CAPITAL LETTER YAT (before lower case)
# Ѣ → E ;          # CYRILLIC CAPITAL LETTER YAT
# ѣ → e ;          # CYRILLIC SMALL LETTER YAT
#
########################################################################
#
# End BGN Page 16 Note 3
#
########################################################################