summaryrefslogtreecommitdiff
path: root/icu4c/source/data/translit/bg_bg_Latn_BGN.txt
diff options
context:
space:
mode:
Diffstat (limited to 'icu4c/source/data/translit/bg_bg_Latn_BGN.txt')
-rw-r--r--icu4c/source/data/translit/bg_bg_Latn_BGN.txt243
1 files changed, 243 insertions, 0 deletions
diff --git a/icu4c/source/data/translit/bg_bg_Latn_BGN.txt b/icu4c/source/data/translit/bg_bg_Latn_BGN.txt
new file mode 100644
index 000000000..d8351ce9b
--- /dev/null
+++ b/icu4c/source/data/translit/bg_bg_Latn_BGN.txt
@@ -0,0 +1,243 @@
+# © 2016 and later: Unicode, Inc. and others.
+# License & terms of use: http://www.unicode.org/copyright.html#License
+#
+# File: bg_bg_Latn_BGN.txt
+# Generated from CLDR
+#
+
+#
+########################################################################
+# BGN/PCGN 1952 System
+#
+# This system was adopted by the BGN in 1949 and by the PCGN in 1952.
+# It reflects the much simplified Bulgarian orthography as officially
+# revised in February 1945. The Bulgarian alphabet contains all of
+# the characters present in the Russian alphabet with the exception
+# of Ёё, Ыы, and Ээ. Two obsolete letters Ѫѫ and Ѣѣ are also given.
+#
+# The Bulgarian Alphabet as defined by the BGN (Page 15):
+#
+# АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢ
+# абвгдежзийклмнопрстуфхцчшщъьюяѫѣ
+#
+# Originally prepared by Michael Everson <everson@evertype.com>
+########################################################################
+#
+# MINIMAL FILTER: Bulgarian-Latin
+#
+:: [АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢабвгдежзийклмнопрстуфхцчшщъьюяѫѣ] ; # Global filter: restricts the transform to the Bulgarian letters listed in the alphabet above.
+:: NFD (NFC) ; # Forward direction normalizes to NFD, reverse to NFC. NOTE(review): NFD splits Й/й (U+0419/U+0439) into И/и + U+0306 - confirm the Й/й rules still match after this pass.
+#
+#
+########################################################################
+#
+########################################################################
+#
+# Define All Transformation Variables
+#
+########################################################################
+#
+$upperConsonants = [БВГДЖЗЙКЛМНПРСТФХЦЧШЩЬ] ; # Capital consonant letters; the soft sign Ь is grouped here.
+$lowerConsonants = [бвгджзйклмнпрстфхцчшщь] ; # Small consonant letters; the soft sign ь is grouped here.
+$consonants = [$upperConsonants $lowerConsonants] ; # Union of both cases; not referenced by any rule shown in this file.
+$upperVowels = [АЕИОУЪЮЯѪѢ] ; # Capital vowel letters, including the obsolete Ѫ and Ѣ.
+$lowerVowels = [аеиоуъюяѫѣ] ; # Small vowel letters, including the obsolete ѫ and ѣ.
+$vowels = [$upperVowels $lowerVowels] ; # Union of both cases; not referenced by any rule shown in this file.
+$lower = [$lowerConsonants $lowerVowels] ; # Any small Bulgarian letter; after-context of the title-case digraph rules (e.g. Ж} $lower → Zh).
+$bulgarian = [ $lower $upperConsonants $upperVowels ] ; # Any Bulgarian letter of either case; used by the word-final Ъ rule.
+#
+#
+# Use this $wordBoundary until bug 2034 is fixed in ICU:
+# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
+#
+$wordBoundary = [^[:L:][:M:][:N:]] ; # Any character that is not a letter, mark, or number.
+#
+#
+########################################################################
+#
+########################################################################
+#
+# Start of Alphabetic Transformations
+#
+########################################################################
+#
+А → A ; # CYRILLIC CAPITAL LETTER A
+а → a ; # CYRILLIC SMALL LETTER A
+Б → B ; # CYRILLIC CAPITAL LETTER BE
+б → b ; # CYRILLIC SMALL LETTER BE
+В → V ; # CYRILLIC CAPITAL LETTER VE
+в → v ; # CYRILLIC SMALL LETTER VE
+Г → G ; # CYRILLIC CAPITAL LETTER GHE
+г → g ; # CYRILLIC SMALL LETTER GHE
+Д → D ; # CYRILLIC CAPITAL LETTER DE
+д → d ; # CYRILLIC SMALL LETTER DE
+Е → E ; # CYRILLIC CAPITAL LETTER IE
+е → e ; # CYRILLIC SMALL LETTER IE
+Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE (title case: next letter is a small Bulgarian letter)
+Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE (all other positions)
+ж → zh ; # CYRILLIC SMALL LETTER ZHE
+З → Z ; # CYRILLIC CAPITAL LETTER ZE
+з → z ; # CYRILLIC SMALL LETTER ZE
+И → I ; # CYRILLIC CAPITAL LETTER I
+и → i ; # CYRILLIC SMALL LETTER I
+Й → Y ; # CYRILLIC CAPITAL LETTER SHORT I
+й → y ; # CYRILLIC SMALL LETTER SHORT I
+К → K ; # CYRILLIC CAPITAL LETTER KA
+к → k ; # CYRILLIC SMALL LETTER KA
+Л → L ; # CYRILLIC CAPITAL LETTER EL
+л → l ; # CYRILLIC SMALL LETTER EL
+М → M ; # CYRILLIC CAPITAL LETTER EM
+м → m ; # CYRILLIC SMALL LETTER EM
+Н → N ; # CYRILLIC CAPITAL LETTER EN
+н → n ; # CYRILLIC SMALL LETTER EN
+О → O ; # CYRILLIC CAPITAL LETTER O
+о → o ; # CYRILLIC SMALL LETTER O
+П → P ; # CYRILLIC CAPITAL LETTER PE
+п → p ; # CYRILLIC SMALL LETTER PE
+Р → R ; # CYRILLIC CAPITAL LETTER ER
+р → r ; # CYRILLIC SMALL LETTER ER
+С → S ; # CYRILLIC CAPITAL LETTER ES
+с → s ; # CYRILLIC SMALL LETTER ES
+#
+#
+########################################################################
+#
+# BGN Page 16 Note 4
+#
+# тс becomes t·s
+#
+########################################################################
+#
+ТС → T·S ; # CAPITAL TE + CAPITAL ES: middle dot keeps the result distinct from TS, which is produced for Ц
+Тс → T·s ; # CAPITAL TE + SMALL ES: middle dot keeps the result distinct from Ts, which is produced for Ц
+тс → t·s ; # SMALL TE + SMALL ES: middle dot keeps the result distinct from ts, which is produced for ц
+Т → T ; # CYRILLIC CAPITAL LETTER TE (not followed by ES as matched above)
+т → t ; # CYRILLIC SMALL LETTER TE (not followed by ES as matched above)
+#
+#
+########################################################################
+#
+# End Note 4
+#
+########################################################################
+У → U ; # CYRILLIC CAPITAL LETTER U
+у → u ; # CYRILLIC SMALL LETTER U
+Ф → F ; # CYRILLIC CAPITAL LETTER EF
+ф → f ; # CYRILLIC SMALL LETTER EF
+Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA (title case: next letter is a small Bulgarian letter)
+Х → KH ; # CYRILLIC CAPITAL LETTER HA (all other positions)
+х → kh ; # CYRILLIC SMALL LETTER HA
+Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE (title case: next letter is a small Bulgarian letter)
+Ц → TS ; # CYRILLIC CAPITAL LETTER TSE (all other positions)
+ц → ts ; # CYRILLIC SMALL LETTER TSE
+Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE (title case: next letter is a small Bulgarian letter)
+Ч → CH ; # CYRILLIC CAPITAL LETTER CHE (all other positions)
+ч → ch ; # CYRILLIC SMALL LETTER CHE
+#
+########################################################################
+#
+# Implied rule from BGN Russian-Latin transliteration (Page 94 Note 3.6).
+#
+# шт becomes sh·t
+#
+########################################################################
+#
+ШТ → SH·T ; # CAPITAL SHA + CAPITAL TE: middle dot keeps the result distinct from SHT, which is produced for Щ
+Шт → Sh·t ; # CAPITAL SHA + SMALL TE: middle dot keeps the result distinct from Sht, which is produced for Щ
+шт → sh·t ; # SMALL SHA + SMALL TE: middle dot keeps the result distinct from sht, which is produced for щ
+Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA (title case: next letter is a small Bulgarian letter)
+Ш → SH ; # CYRILLIC CAPITAL LETTER SHA (all other positions)
+ш → sh ; # CYRILLIC SMALL LETTER SHA
+Щ} $lower → Sht ; # CYRILLIC CAPITAL LETTER SHCHA (title case: next letter is a small Bulgarian letter)
+Щ → SHT ; # CYRILLIC CAPITAL LETTER SHCHA (all other positions)
+щ → sht ; # CYRILLIC SMALL LETTER SHCHA
+#
+#
+########################################################################
+#
+# End Implied rule
+#
+########################################################################
+#
+########################################################################
+#
+# BGN Page 16 Note 1
+#
+# In modern Bulgarian orthography, the character ъ does not occur in
+# word-final position. It should be omitted in romanization when found
+# in older sources.
+#
+# The following rule removes all Ъъ at the end of a word. It is assumed
+# that when the condition is met, the text must be from an older source.
+# Comment out with a '#' at the start of a line to disable.
+#
+# Ordering: rules are tried in file order and the first match wins, so
+# this rule has to come before the unconditional Ъ/ъ rules; placed after
+# them it can never fire.
+#
+# Before-context: the text is rewritten in place from left to right, so
+# by the time Ъ/ъ is reached the preceding letter has already been
+# romanized. The before-context therefore accepts Latin letters as well
+# as (not yet converted) Bulgarian ones. A Ъ/ъ with no letter in front
+# of it (a word consisting only of Ъ/ъ) is left to the general rules.
+#
+########################################################################
+#
+[$bulgarian [:Latin:]] { [Ъъ] } $wordBoundary → ; # word-final hard sign: delete
+Ъ → Ŭ ; # CYRILLIC CAPITAL LETTER HARD SIGN (all other positions)
+ъ → ŭ ; # CYRILLIC SMALL LETTER HARD SIGN (all other positions)
+#
+#
+########################################################################
+#
+# End BGN Page 16 Note 1
+#
+########################################################################
+Ь → ’ ; # CYRILLIC CAPITAL LETTER SOFT SIGN (same output as the small letter)
+ь → ’ ; # CYRILLIC SMALL LETTER SOFT SIGN
+Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU (title case: next letter is a small Bulgarian letter)
+Ю → YU ; # CYRILLIC CAPITAL LETTER YU (all other positions)
+ю → yu ; # CYRILLIC SMALL LETTER YU
+Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA (title case: next letter is a small Bulgarian letter)
+Я → YA ; # CYRILLIC CAPITAL LETTER YA (all other positions)
+я → ya ; # CYRILLIC SMALL LETTER YA
+#
+########################################################################
+#
+# BGN Page 16 Note 2
+#
+# The obsolete character Ѫ, which was replaced by Ъ in 1945, should be
+# romanized Ŭ.
+#
+########################################################################
+#
+Ѫ → Ŭ ; # CYRILLIC CAPITAL LETTER BIG YUS (same output as the rule for Ъ)
+ѫ → ŭ ; # CYRILLIC SMALL LETTER BIG YUS (same output as the rule for ъ)
+#
+#
+########################################################################
+#
+# End BGN Page 16 Note 2
+#
+########################################################################
+#
+########################################################################
+#
+# BGN Page 16 Note 3
+#
+# The obsolete character Ѣ, replaced in 1945 by Я or Е according to local
+# pronunciation, should be romanized as e or ya, accordingly, if the
+# pronunciation is known; otherwise as ye.
+#
+########################################################################
+#
+Ѣ} $lower → Ye ; # CYRILLIC CAPITAL LETTER YAT (title case: next letter is a small Bulgarian letter); default "ye" reading, pronunciation unknown
+Ѣ → YE ; # CYRILLIC CAPITAL LETTER YAT (all other positions)
+ѣ → ye ; # CYRILLIC SMALL LETTER YAT
+#
+#
+# Alternative rule where appropriate for local pronounciation. To apply
+# uncomment the following by removing the '#' mark at the start of the
+# line and insert before the three rule lines above.
+#
+# Ѣ} $lower → e ; # CYRILLIC CAPITAL LETTER YAT
+# Ѣ → E ; # CYRILLIC CAPITAL LETTER YAT
+# ѣ → e ; # CYRILLIC SMALL LETTER YAT
+#
+########################################################################
+#
+# End BGN Page 16 Note 3
+#
+########################################################################
+