tor-browser

The Tor Browser
git clone https://git.dasho.dev/tor-browser.git
Log | Files | Refs | README | LICENSE

bg_bg_Latn_BGN.txt (8514B)


      1 # © 2016 and later: Unicode, Inc. and others.
      2 # License & terms of use: http://www.unicode.org/copyright.html
      3 # Generated using tools/cldr/cldr-to-icu/
      4 #
      5 # File: bg_bg_Latn_BGN.txt
      6 # Generated from CLDR
      7 #
      8 
      9 #
     10 ########################################################################
     11 # BGN/PCGN 1952 System
     12 #
     13 # This system was adopted by the BGN in 1949 and by the PCGN in 1952.
     14 # It reflects the much simplified Bulgarian orthography as officially
     15 # revised in February 1945. The Bulgarian alphabet contains all of
     16 # the characters present in the Russian alphabet with the exception
     17 # of Ёё, Ыы, and Ээ. Two obsolete letters Ѫѫ and Ѣѣ are also given.
     18 #
     19 # The Bulgarian Alphabet as defined by the BGN (Page 15):
     20 #
     21 #   АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢ
     22 #   абвгдежзийклмнопрстуфхцчшщъьюяѫѣ
     23 #
     24 # Originally prepared by Michael Everson <everson@evertype.com>
     25 ########################################################################
     26 #
     27 # MINIMAL FILTER: Bulgarian-Latin
     28 #
     29 :: [АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢабвгдежзийклмнопрстуфхцчшщъьюяѫѣ] ; # global filter: only these Cyrillic letters are handed to the rules below
     30 :: NFD (NFC) ; # forward direction applies NFD; the parenthesised NFC is for the inverse direction. NOTE(review): NFD decomposes Й/й into И/и + U+0306 - confirm the Й/й rules below can still match.
     31 #
     32 #
     33 ########################################################################
     34 #
     35 ########################################################################
     36 #
     37 # Define All Transformation Variables
     38 #
     39 ########################################################################
     40 #
     41 $upperConsonants = [БВГДЖЗЙКЛМНПРСТФХЦЧШЩЬ] ; # uppercase consonants; the set also lists Й and the soft sign Ь
     42 $lowerConsonants = [бвгджзйклмнпрстфхцчшщь] ; # lowercase counterparts of $upperConsonants
     43 $consonants = [$upperConsonants $lowerConsonants] ; # not referenced by the rules shown in this file
     44 $upperVowels = [АЕИОУЪЮЯѪѢ] ; # uppercase vowels, including Ъ and the obsolete Ѫ and Ѣ
     45 $lowerVowels = [аеиоуъюяѫѣ] ; # lowercase counterparts of $upperVowels
     46 $vowels = [$upperVowels $lowerVowels] ; # not referenced by the rules shown in this file
     47 $lower = [$lowerConsonants $lowerVowels] ; # any lowercase letter; used as look-ahead to pick title-case output (e.g. Zh rather than ZH)
     48 $bulgarian = [ $lower $upperConsonants $upperVowels ] ; # every letter of either case listed above
     49 #
     50 #
     51 # Use this $wordBoundary until bug 2034 is fixed in ICU:
     52 # http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
     53 #
     54 $wordBoundary =  [^[:L:][:M:][:N:]] ; # any character that is not a letter, mark, or number
     55 #
     56 #
     57 ########################################################################
     58 #
     59 ########################################################################
     60 #
     61 # Start of Alphabetic Transformations
     62 #
     63 ########################################################################
     64 #
     65 А → A ; # CYRILLIC CAPITAL LETTER A
     66 а → a ; # CYRILLIC SMALL LETTER A
     67 Б → B ; # CYRILLIC CAPITAL LETTER BE
     68 б → b ; # CYRILLIC SMALL LETTER BE
     69 В → V ; # CYRILLIC CAPITAL LETTER VE
     70 в → v ; # CYRILLIC SMALL LETTER VE
     71 Г → G ; # CYRILLIC CAPITAL LETTER GHE
     72 г → g ; # CYRILLIC SMALL LETTER GHE
     73 Д → D ; # CYRILLIC CAPITAL LETTER DE
     74 д → d ; # CYRILLIC SMALL LETTER DE
     75 Е → E ; # CYRILLIC CAPITAL LETTER IE
     76 е → e ; # CYRILLIC SMALL LETTER IE
     77 Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE (title case when a lowercase letter follows)
     78 Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE
     79 ж → zh ; # CYRILLIC SMALL LETTER ZHE
     80 З → Z ; # CYRILLIC CAPITAL LETTER ZE
     81 з → z ; # CYRILLIC SMALL LETTER ZE
     82 И → I ; # CYRILLIC CAPITAL LETTER I
     83 и → i ; # CYRILLIC SMALL LETTER I
     84 Й → Y ; # CYRILLIC CAPITAL LETTER SHORT I
     85 й → y ; # CYRILLIC SMALL LETTER SHORT I
     86 К → K ; # CYRILLIC CAPITAL LETTER KA
     87 к → k ; # CYRILLIC SMALL LETTER KA
     88 Л → L ; # CYRILLIC CAPITAL LETTER EL
     89 л → l ; # CYRILLIC SMALL LETTER EL
     90 М → M ; # CYRILLIC CAPITAL LETTER EM
     91 м → m ; # CYRILLIC SMALL LETTER EM
     92 Н → N ; # CYRILLIC CAPITAL LETTER EN
     93 н → n ; # CYRILLIC SMALL LETTER EN
     94 О → O ; # CYRILLIC CAPITAL LETTER O
     95 о → o ; # CYRILLIC SMALL LETTER O
     96 П → P ; # CYRILLIC CAPITAL LETTER PE
     97 п → p ; # CYRILLIC SMALL LETTER PE
     98 Р → R ; # CYRILLIC CAPITAL LETTER ER
     99 р → r ; # CYRILLIC SMALL LETTER ER
    100 С → S ; # CYRILLIC CAPITAL LETTER ES
    101 с → s ; # CYRILLIC SMALL LETTER ES
    102 #
    103 #
    104 ########################################################################
    105 #
    106 # BGN Page 16 Note 4
    107 #
    108 # тс becomes t·s
    109 #
    110 ########################################################################
    111 #
    112 ТС → T·S ; # CYRILLIC CAPITAL LETTER TE + CAPITAL ES; the middle dot keeps the output distinct from Ц → TS
    113 Тс → T·s ; # CYRILLIC CAPITAL LETTER TE + SMALL ES
    114 тс → t·s ; # CYRILLIC SMALL LETTER TE + SMALL ES
    115 Т → T ; # CYRILLIC CAPITAL LETTER TE (listed after the two-letter rules so those are tried first)
    116 т → t ; # CYRILLIC SMALL LETTER TE
    117 #
    118 #
    119 ########################################################################
    120 #
    121 # End Note 4
    122 #
    123 ########################################################################
    124 У → U ; # CYRILLIC CAPITAL LETTER U
    125 у → u ; # CYRILLIC SMALL LETTER U
    126 Ф → F ; # CYRILLIC CAPITAL LETTER EF
    127 ф → f ; # CYRILLIC SMALL LETTER EF
    128 Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA (title case when a lowercase letter follows)
    129 Х → KH ; # CYRILLIC CAPITAL LETTER HA
    130 х → kh ; # CYRILLIC SMALL LETTER HA
    131 Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE (title case when a lowercase letter follows)
    132 Ц → TS ; # CYRILLIC CAPITAL LETTER TSE
    133 ц → ts ; # CYRILLIC SMALL LETTER TSE
    134 Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE (title case when a lowercase letter follows)
    135 Ч → CH ; # CYRILLIC CAPITAL LETTER CHE
    136 ч → ch ; # CYRILLIC SMALL LETTER CHE
    137 #
    138 ########################################################################
    139 #
    140 # Implied rule from BGN Russian-Latin transliteration (Page 94 Note 3.6).
    141 #
    142 # шт becomes sh·t
    143 #
    144 ########################################################################
    145 #
    146 ШТ → SH·T ; # CYRILLIC CAPITAL LETTER SHA + CAPITAL TE; the middle dot keeps the output distinct from Щ → SHT
    147 Шт → Sh·t ; # CYRILLIC CAPITAL LETTER SHA + SMALL TE
    148 шт → sh·t ; # CYRILLIC SMALL LETTER SHA + SMALL TE
    149 Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA (title case when a lowercase letter follows)
    150 Ш → SH ; # CYRILLIC CAPITAL LETTER SHA
    151 ш → sh ; # CYRILLIC SMALL LETTER SHA
    152 Щ} $lower → Sht ; # CYRILLIC CAPITAL LETTER SHCHA (title case when a lowercase letter follows)
    153 Щ → SHT ; # CYRILLIC CAPITAL LETTER SHCHA
    154 щ → sht ; # CYRILLIC SMALL LETTER SHCHA
    155 #
    156 #
    157 ########################################################################
    158 #
    159 # End Implied rule
    160 #
    161 ########################################################################
    162 #
    163 ########################################################################
    164 #
    165 # BGN Page 16 Note 1
    166 #
    167 # In modern Bulgarian orthography, the character ъ does not occur in
    168 # word-final position.  It should be omitted in romanization when found
    169 # on older sources.
    170 #
    171 # The following rule removes all Ъъ at the end of a word. It is assumed
    172 # that when the condition is met, the text must be from an older source.
    173 # Comment out with a '#' at the start of a line to disable.
    174 #
    175 # Keep this rule ahead of the plain Ъ/ъ rules: the first matching rule wins.
    176 ########################################################################
    177 #
    178 $bulgarian { [Ъъ]  } $wordBoundary > ; # drop Ъ/ъ that follows a Bulgarian letter and precedes a character that is not a letter, mark, or number
    179 #
    180 #
    181 ########################################################################
    182 #
    183 # End BGN Page 16 Note 1
    184 #
    185 ########################################################################
    186 Ъ → Ŭ ; # CYRILLIC CAPITAL LETTER HARD SIGN (any Ъ not removed by the word-final rule above)
    187 ъ → ŭ ; # CYRILLIC SMALL LETTER HARD SIGN (any ъ not removed by the word-final rule above)
    188 Ь → ’ ; # CYRILLIC CAPITAL LETTER SOFT SIGN (both cases map to the same ’ mark)
    189 ь → ’ ; # CYRILLIC SMALL LETTER SOFT SIGN
    190 Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU (title case when a lowercase letter follows)
    191 Ю → YU ; # CYRILLIC CAPITAL LETTER YU
    192 ю → yu ; # CYRILLIC SMALL LETTER YU
    193 Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA (title case when a lowercase letter follows)
    194 Я → YA ; # CYRILLIC CAPITAL LETTER YA
    195 я → ya ; # CYRILLIC SMALL LETTER YA
    196 #
    197 ########################################################################
    198 #
    199 # BGN Page 16 Note 2
    200 #
    201 # The obsolete character Ѫ, which was replaced by Ъ in 1945, should be
    202 # romanized Ŭ.
    203 #
    204 ########################################################################
    205 #
    206 Ѫ → Ŭ ; # CYRILLIC CAPITAL LETTER BIG YUS (same Latin output as Ъ)
    207 ѫ → ŭ ; # CYRILLIC SMALL LETTER BIG YUS (same Latin output as ъ)
    208 #
    209 #
    210 ########################################################################
    211 #
    212 # End BGN Page 16 Note 2
    213 #
    214 ########################################################################
    215 #
    216 ########################################################################
    217 #
    218 # BGN Page 16 Note 3
    219 #
    220 # The obsolete character Ѣ, replaced in 1945 by Я or Е according to local
    221 # pronunciation, should be romanized as e or ya, accordingly, if the
    222 # pronunciation is known; otherwise as ye.
    223 #
    224 ########################################################################
    225 #
    226 Ѣ} $lower → Ye ; # CYRILLIC CAPITAL LETTER YAT (title case when a lowercase letter follows); default "ye" form for unknown pronunciation
    227 Ѣ → YE ; # CYRILLIC CAPITAL LETTER YAT
    228 ѣ → ye ; # CYRILLIC SMALL LETTER YAT
    229 #
    230 #
    231 # Alternative rule where appropriate for local pronunciation. To apply,
    232 # uncomment the three lines below (remove the leading '#') and move them
    233 # before the three rule lines above.
    234 #
    235 # Ѣ} $lower → E ; # CYRILLIC CAPITAL LETTER YAT
    236 # Ѣ → E ; # CYRILLIC CAPITAL LETTER YAT
    237 # ѣ → e ; # CYRILLIC SMALL LETTER YAT
    238 #
    239 ########################################################################
    240 #
    241 # End BGN Page 16 Note 3
    242 #
    243 ########################################################################