_cyrillic_base.yml 5.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268
  1. general:
  2. name: Cyrillic base
  3. notes: copied from Ukrainian .cfg file.
  4. roman_to_script:
  5. ignore:
  6. - "At head of title"
  7. - "Colophon"
  8. - "II"
  9. - "III"
  10. - "IV"
  11. - "IX"
  12. - "LI"
  13. - "LII"
  14. - "LIII"
  15. - "LIV"
  16. - "LIX"
  17. - "LV"
  18. - "LVI"
  19. - "LVII"
  20. - "LVIII"
  21. - "LX"
  22. - "LXI"
  23. - "LXII"
  24. - "LXIII"
  25. - "LXIV"
  26. - "LXIX"
  27. - "LXV"
  28. - "LXVI"
  29. - "LXVII"
  30. - "LXVIII"
  31. - "LXX"
  32. - "LXXI"
  33. - "LXXII"
  34. - "LXXIII"
  35. - "LXXIV"
  36. - "LXXIX"
  37. - "LXXV"
  38. - "LXXVI"
  39. - "LXXVII"
  40. - "LXXVIII"
  41. - "LXXX"
  42. - "LXXXI"
  43. - "LXXXII"
  44. - "LXXXIII"
  45. - "LXXXIV"
  46. - "LXXXIX"
  47. - "LXXXV"
  48. - "LXXXVI"
  49. - "LXXXVII"
  50. - "LXXXVIII"
  51. - "VI"
  52. - "VII"
  53. - "VIII"
  54. - "XI"
  55. - "XII"
  56. - "XIII"
  57. - "XIV"
  58. - "XIX"
  59. - "XL"
  60. - "XLI"
  61. - "XLII"
  62. - "XLIII"
  63. - "XLIV"
  64. - "XLIX"
  65. - "XLV"
  66. - "XLVI"
  67. - "XLVII"
  68. - "XLVIII"
  69. - "XV"
  70. - "XVI"
  71. - "XVII"
  72. - "XVIII"
  73. - "XX"
  74. - "XXI"
  75. - "XXII"
  76. - "XXIII"
  77. - "XXIV"
  78. - "XXIX"
  79. - "XXV"
  80. - "XXVI"
  81. - "XXVII"
  82. - "XXVIII"
  83. - "XXX"
  84. - "XXXI"
  85. - "XXXII"
  86. - "XXXIII"
  87. - "XXXIV"
  88. - "XXXIX"
  89. - "XXXV"
  90. - "XXXVI"
  91. - "XXXVII"
  92. - "XXXVIII"
  93. - "and one other"
  94. - "and two others"
  95. - "and three others"
  96. - "and four others"
  97. - "and five others"
  98. - "and six others"
  99. - "and seven others"
  100. - "and eight others"
  101. - "and nine others"
  102. - "and ten others"
  103. - "and eleven others"
  104. - "and twelve others"
  105. - "and thirteen others"
  106. - "and fourteen others"
  107. - "and fifteen others"
  108. - "and sixteen others"
  109. - "and seventeen others"
  110. - "and eighteen others"
  111. - "and nineteen others"
  112. - "and others"
  113. - "et al."
  114. - "date of publication not identified"
  115. - "Place of publication not identified"
  116. - "publisher not identified"
  117. map:
  118. "A": "\u0410"
  119. "a": "\u0430"
  120. "B": "\u0411"
  121. "b": "\u0431"
  122. "V": "\u0412"
  123. "v": "\u0432"
  124. "H": "\u0413"
  125. "h": "\u0433"
  126. "G": "\u0490"
  127. "g": "\u0491"
  128. "D": "\u0414"
  129. "d": "\u0434"
  130. "E": "\u0415"
  131. "e": "\u0435"
  132. "Z\uFE20H\uFE21": "\u0416"
  133. # mixed-case variant of the preceding Z\uFE20H\uFE21 entry; shouldn't be needed, but does no harm
  134. "Z\uFE20h\uFE21": "\u0416"
  135. "Z": "\u0417"
  136. "z\uFE20h\uFE21": "\u0436"
  137. "z": "\u0437"
  138. "Y": "\u0418"
  139. "y": "\u0438"
  140. "I\u0306": "\u0419"
  141. "I\u0308": "\u0407"
  142. "I\uFE20E\uFE21": "\u0404"
  143. # mixed-case variant of the preceding I\uFE20E\uFE21 entry; shouldn't be needed, but does no harm
  144. "I\uFE20e\uFE21": "\u0404"
  145. "I\uFE20O\uFE21": "\u0401"
  146. # mixed-case variant of the preceding I\uFE20O\uFE21 entry; shouldn't be needed, but does no harm
  147. "I\uFE20o\uFE21": "\u0401"
  148. "I\uFE20U\uFE21": "\u042E"
  149. # mixed-case variant of the preceding I\uFE20U\uFE21 entry; shouldn't be needed, but does no harm
  150. "I\uFE20u\uFE21": "\u042E"
  151. "I\uFE20A\uFE21": "\u042F"
  152. # mixed-case variant of the preceding I\uFE20A\uFE21 entry; shouldn't be needed, but does no harm
  153. "I\uFE20a\uFE21": "\u042F"
  154. "I": "\u0406"
  155. "i\u0306": "\u0439"
  156. "i\u0308": "\u0457"
  157. "i\uFE20e\uFE21": "\u0454"
  158. "i\uFE20o\uFE21": "\u0451"
  159. "i\uFE20u\uFE21": "\u044E"
  160. "i\uFE20a\uFE21": "\u044F"
  161. "i": "\u0456"
  162. # all-caps variant of "Kh" (the form script_to_roman emits); shouldn't be needed, but does no harm
  163. "KH": "\u0425"
  164. "Kh": "\u0425"
  165. "K": "\u041A"
  166. "kh": "\u0445"
  167. "k": "\u043A"
  168. "L": "\u041B"
  169. "l": "\u043B"
  170. "M": "\u041C"
  171. "m": "\u043C"
  172. "N": "\u041D"
  173. "n": "\u043D"
  174. "O": "\u041E"
  175. "o": "\u043E"
  176. "P": "\u041F"
  177. "p": "\u043F"
  178. "R": "\u0420"
  179. "r": "\u0440"
  180. # all-caps variant of "Shch" (the form script_to_roman emits); shouldn't be needed, but does no harm
  181. "SHCH": "\u0429"
  182. "Shch": "\u0429"
  183. # all-caps variant of "Sh" (the form script_to_roman emits); shouldn't be needed, but does no harm
  184. "SH": "\u0428"
  185. "Sh": "\u0428"
  186. "S": "\u0421"
  187. "shch": "\u0449"
  188. "sh": "\u0448"
  189. "s": "\u0441"
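  190. # this conversion shouldn't be needed, but does no harm -- NOTE(review): the parallel all-caps ligature entries (Z\uFE20H\uFE21, I\uFE20E\uFE21) carry no such caveat; confirm it is intended here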
  191. "T\uFE20S\uFE21": "\u0426"
  192. # mixed-case variant of the preceding T\uFE20S\uFE21 entry; shouldn't be needed, but does no harm
  193. "T\uFE20s\uFE21": "\u0426"
  194. "T": "\u0422"
  195. "t\uFE20s\uFE21": "\u0446"
  196. "t": "\u0442"
  197. "U": "\u0423"
  198. "u": "\u0443"
  199. "F": "\u0424"
  200. "f": "\u0444"
  201. # all-caps variant of "Ch" (the form script_to_roman emits); shouldn't be needed, but does no harm
  202. "CH": "\u0427"
  203. "Ch": "\u0427"
  204. "ch": "\u0447"
  205. # drops a bare combining ligature left half (U+FE20) by mapping it to the empty string; shouldn't be needed, but does no harm
  206. "\uFE20": ""
  207. # drops a bare combining ligature right half (U+FE21) by mapping it to the empty string; shouldn't be needed, but does no harm
  208. "\uFE21": ""
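  209. # this conversion is ambiguous: the modifier prime (U+02B9) is mapped to lower-case \u044C here, but upper-case \u042C is also theoretically possible, since script_to_roman maps both to U+02B9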
  210. "\u02B9": "\u044C"
  211. script_to_roman:
  212. map:
  213. "\u0404": "I\uFE20E\uFE21"
  214. "\u0407": "I\u0308"
  215. "\u0410": "A"
  216. "\u0411": "B"
  217. "\u0412": "V"
  218. "\u0414": "D"
  219. "\u0415": "E"
  220. "\u0417": "Z"
  221. "\u0419": "I\u0306"
  222. "\u041A": "K"
  223. "\u041B": "L"
  224. "\u041C": "M"
  225. "\u041D": "N"
  226. "\u041E": "O"
  227. "\u041F": "P"
  228. "\u0420": "R"
  229. "\u0421": "S"
  230. "\u0422": "T"
  231. "\u0423": "U"
  232. "\u0424": "F"
  233. "\u0425": "Kh"
  234. "\u0427": "Ch"
  235. "\u0428": "Sh"
  236. "\u0429": "Shch"
  237. "\u042C": "\u02B9"
  238. "\u042E": "I\uFE20U\uFE21"
  239. "\u042F": "I\uFE20A\uFE21"
  240. "\u0430": "a"
  241. "\u0431": "b"
  242. "\u0432": "v"
  243. "\u0433": "h"
  244. "\u0434": "d"
  245. "\u0435": "e"
  246. "\u0437": "z"
  247. "\u0439": "i\u0306"
  248. "\u043A": "k"
  249. "\u043B": "l"
  250. "\u043C": "m"
  251. "\u043D": "n"
  252. "\u043E": "o"
  253. "\u043F": "p"
  254. "\u0440": "r"
  255. "\u0441": "s"
  256. "\u0442": "t"
  257. "\u0443": "u"
  258. "\u0444": "f"
  259. "\u0445": "kh"
  260. "\u0447": "ch"
  261. "\u0448": "sh"
  262. "\u0449": "shch"
  263. "\u044C": "\u02B9"
  264. "\u044E": "i\uFE20u\uFE21"
  265. "\u044F": "i\uFE20a\uFE21"