church_slavonic.yml 5.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210
  1. general:
  2. name: Church Slavonic
  3. parents:
  4. - _cyrillic_base
  5. roman_to_script:
  6. map:
  7. # CONVERSION OF "I/i" LIGATED TO "A/a" (all capitalization patterns)
  8. "i\uFE20A\uFE21": "\u044F"
  9. "V\u0307": "\u0474"
  10. "v\u0307": "\u0475"
  11. "G\u0301": "\u0494"
  12. "g\u0301": "\u0495"
  13. "G": "\u0413"
  14. "g": "\u0433"
  15. # CONVERSION OF "I/i" LIGATED TO "E/e", SOME WITH MACRON (0304) AND OGONEK (0328)
  16. "I\uFE20E\uFE21\u0304": "\u0464"
  17. "I\uFE20E\u0304\uFE21": "\u0464"
  18. "I\uFE20e\uFE21\u0304": "\u0464"
  19. "I\uFE20e\u0304\uFE21": "\u0464"
  20. "I\uFE20E\uFE21\u0328": "\u0468"
  21. "I\uFE20E\u0328\uFE21": "\u0468"
  22. "I\uFE20e\uFE21\u0328": "\u0468"
  23. "I\uFE20e\u0328\uFE21": "\u0468"
  24. "i\uFE20e\uFE21\u0304": "\u0465"
  25. "i\uFE20e\u0304\uFE21": "\u0465"
  26. "i\uFE20E\uFE21\u0304": "\u0465"
  27. "i\uFE20E\u0304\uFE21": "\u0465"
  28. "i\uFE20e\uFE21\u0328": "\u0469"
  29. "i\uFE20e\u0328\uFE21": "\u0469"
  30. "i\uFE20E\uFE21\u0328": "\u0469"
  31. "i\uFE20E\u0328\uFE21": "\u0469"
  32. "I\uFE20E\uFE21": "\u0462"
  33. "I\uFE20e\uFE21": "\u0462"
  34. "i\uFE20e\uFE21": "\u0463"
  35. "i\uFE20E\uFE21": "\u0463"
  36. # CONVERSION OF "E/e" WITH MACRON (0304), DOT ABOVE (0307), DIAERESIS (0308), OGONEK (0328), & CARON (030C)
  37. "E\u030C": "\u0462"
  38. "E\u0304": "\u0404"
  39. "E\u0307": "\u042D"
  40. "E\u0308": "\u0401"
  41. "E\u0328": "\u0466"
  42. "e\u030C": "\u0463"
  43. "e\u0304": "\u0454"
  44. "e\u0307": "\u044D"
  45. "e\u0308": "\u0451"
  46. "e\u0328": "\u0467"
  47. "ZH": "\u0416"
  48. "Zh": "\u0416"
  49. "zH": "\u0436"
  50. "zh": "\u0436"
  51. # CONVERSION OF "I/i" LIGATED TO "O/o" WITH MACRON (0304) AND OGONEK (0328)
  52. "I\uFE20O\uFE21\u0328": "\u046C"
  53. "I\uFE20O\u0328\uFE21": "\u046C"
  54. "I\uFE20o\uFE21\u0328": "\u046C"
  55. "I\uFE20o\u0328\uFE21": "\u046C"
  56. "i\uFE20o\uFE21\u0328": "\u046D"
  57. "i\uFE20o\u0328\uFE21": "\u046D"
  58. "i\uFE20O\uFE21\u0328": "\u046D"
  59. "i\uFE20O\u0328\uFE21": "\u046D"
  60. # CONVERSION OF "I/i" LIGATED TO "U/u"
  61. "i\uFE20U\uFE21": "\u044E"
  62. # CONVERSION OF "I/i" WITH MACRON (0304) AND BREVE (0306)
  63. "I\u0304": "\u0406"
  64. "i\u0304": "\u0456"
  65. # CONVERSION OF REMAINING LONE "I/i"
  66. "I": "\u0418"
  67. "i": "\u0438"
  68. "kH": "\u0445"
  69. "K\uFE20S\uFE21": "\u046E"
  70. "K\uFE20s\uFE21": "\u046E"
  71. "k\uFE20s\uFE21": "\u046F"
  72. "k\uFE20S\uFE21": "\u046F"
  73. # CONVERSION OF "O/o" WITH OR WITHOUT MACRON (0304), LIGATED TO "T/t"
  74. "O\u0304\uFE20T\uFE21": "\u047E"
  75. "O\u0304\uFE20t\uFE21": "\u047E"
  76. "O\uFE20\u0304T\uFE21": "\u047E"
  77. "O\uFE20\u0304t\uFE21": "\u047E"
  78. "O\uFE20T\uFE21": "\u047E"
  79. "O\uFE20t\uFE21": "\u047E"
  80. "o\u0304\uFE20t\uFE21": "\u047F"
  81. "o\u0304\uFE20T\uFE21": "\u047F"
  82. "o\uFE20\u0304t\uFE21": "\u047F"
  83. "o\uFE20\u0304T\uFE21": "\u047F"
  84. "o\uFE20t\uFE21": "\u047F"
  85. "o\uFE20T\uFE21": "\u047F"
  86. # CONVERSION OF "O/o" WITH MACRON (0304) AND OGONEK (0328)
  87. "O\u0328": "\u046A"
  88. "o\u0328": "\u046B"
  89. "O\u0304": "\u0460"
  90. "o\u0304": "\u0461"
  91. "P\uFE20S\uFE21": "\u0470"
  92. "P\uFE20s\uFE21": "\u0470"
  93. "p\uFE20s\uFE21": "\u0471"
  94. "p\uFE20S\uFE21": "\u0471"
  95. "SHT": "\u0429"
  96. "SHt": "\u0429"
  97. "Sht": "\u0429"
  98. "sHT": "\u0449"
  99. "shT": "\u0449"
  100. "sht": "\u0449"
  101. "sH": "\u0448"
  102. "T\uFE20S\uFE21": "\u0426"
  103. "T\uFE20s\uFE21": "\u0426"
  104. "t\uFE20s\uFE21": "\u0446"
  105. "t\uFE20S\uFE21": "\u0446"
  106. "U\u0304": "\u0478"
  107. "u\u0304": "\u0479"
  108. "F\u0307": "\u0472"
  109. "f\u0307": "\u0473"
  110. "cH": "\u0447"
  111. "Y\u0307": "\u0476"
  112. "y\u0307": "\u0477"
  113. "Y": "\u042B"
  114. "y": "\u044B"
  115. # this conversion is ambiguous - \u042C is also theoretically possible
  116. "\u0027": "\u044C"
  117. # this conversion is ambiguous - \u042A is also theoretically possible
  118. "\u02BA": "\u044A"
  119. script_to_roman:
  120. map:
  121. # CONVERSION TO "I/i" LIGATED TO "A/a"
  122. "\u0474": "V\u0307"
  123. "\u0475": "v\u0307"
  124. "\u0494": "G\u0301"
  125. "\u0495": "g\u0301"
  126. "\u0413": "G"
  127. "\u0433": "g"
  128. # CONVERSION TO "I/i" LIGATED TO "E/e" WITH DIACRITICS
  129. "\u0464": "I\uFE20E\uFE21\u0304"
  130. "\u0468": "I\uFE20E\uFE21\u0328"
  131. "\u0465": "i\uFE20e\uFE21\u0304"
  132. "\u0469": "i\uFE20e\uFE21\u0328"
  133. # CONVERSION TO "E/e" WITH MACRON (0304), DOT ABOVE (0307), DIAERESIS (0308), OGONEK (0328), & CARON (030C)
  134. "\u0462": "E\u030C"
  135. "\u0404": "E\u0304"
  136. "\u042D": "E\u0307"
  137. "\u0401": "E\u0308"
  138. "\u0466": "E\u0328"
  139. "\u0463": "e\u030C"
  140. "\u0454": "e\u0304"
  141. "\u044D": "e\u0307"
  142. "\u0451": "e\u0308"
  143. "\u0467": "e\u0328"
  144. "\u0416": "Zh"
  145. "\u0436": "zh"
  146. # CONVERSION TO "I/i" LIGATED TO "O/o" WITH MACRON (0304) AND OGONEK (0328)
  147. "\u046C": "I\uFE20O\uFE21\u0328"
  148. "\u046D": "i\uFE20o\uFE21\u0328"
  149. # CONVERSION TO "I/i" LIGATED TO "U/u"
  150. # CONVERSION TO "I/i" WITH MACRON (0304) AND BREVE (0306)
  151. "\u0406": "I\u0304"
  152. "\u0456": "i\u0304"
  153. # CONVERSION TO LONE "I/i"
  154. "\u0418": "I"
  155. "\u0438": "i"
  156. "\u046E": "K\uFE20S\uFE21"
  157. "\u046F": "k\uFE20s\uFE21"
  158. # CONVERSION TO "O/o" WITH MACRON (0304) LIGATED TO "T/t"
  159. "\u047E": "O\uFE20\u0304t\uFE21"
  160. "\u047F": "o\uFE20\u0304t\uFE21"
  161. # CONVERSION TO "O/o" WITH MACRON (0304) AND OGONEK (0328)
  162. "\u046A": "O\u0328"
  163. "\u046B": "o\u0328"
  164. "\u0460": "O\u0304"
  165. "\u0461": "o\u0304"
  166. # CONVERSION TO LONE "O/o"
  167. "\u0470": "P\uFE20S\uFE21"
  168. "\u0471": "p\uFE20s\uFE21"
  169. "\u0429": "Sht"
  170. "\u0449": "sht"
  171. "\u0426": "T\uFE20S\uFE21"
  172. "\u0446": "t\uFE20s\uFE21"
  173. "\u0478": "U\u0304"
  174. "\u0479": "u\u0304"
  175. "\u0472": "F\u0307"
  176. "\u0473": "f\u0307"
  177. "\u0476": "Y\u0307"
  178. "\u0477": "y\u0307"
  179. # Uppercase hard sign (ambiguously maps to one Latin character)
  180. "\u042A": "\u02BA"
  181. # Lowercase hard sign (ambiguously maps to one Latin character)
  182. "\u044A": "\u02BA"
  183. # Uppercase soft sign (ambiguously maps to one Latin character)
  184. # Lowercase soft sign (ambiguously maps to one Latin character)
  185. "\u042B": "Y"
  186. "\u044B": "y"