_cyrillic_base.yml 3.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133
  # Table metadata: a display name, the list of parent tables, and free-text notes.
  1. general:
  2. name: Cyrillic base
  # NOTE(review): presumably the settings of every table listed under "parents"
  # are inherited by this one - confirm against the code that loads these files.
  3. parents:
  4. - _ignore_base
  # NOTE(review): the notes below say a Russian ignore list was left "here", but no
  # ignore list appears in this table; it may live in _ignore_base - confirm.
  5. notes: >
  6. copied from Russian .cfg file and stripped
  7. off language-specific tokens. Russian ignore list
  8. has been left here on purpose, assuming it's valid
  9. for all child languages.
  # Latin (romanized) -> Cyrillic direction. Every key under "map" is a romanized
  # token; every value is the Cyrillic replacement, or an empty string for the two
  # stand-alone ligature half marks near the end of the map.
  # Several Cyrillic letters (e.g. U+0413, U+0416, U+0418) have no entry here, which
  # matches the table notes about language-specific tokens having been stripped.
  # NOTE(review): many of the "shouldn't be needed" comments below do not obviously
  # describe the entry that follows them (one pair is duplicated with nothing in
  # between); they look like leftovers from removed entries - confirm and re-attach
  # or drop them.
  10. roman_to_script:
  11. map:
  12. "A": "\u0410"
  13. "a": "\u0430"
  14. "B": "\u0411"
  15. "b": "\u0431"
  16. "V": "\u0412"
  17. "v": "\u0432"
  18. "D": "\u0414"
  19. "d": "\u0434"
  20. "E": "\u0415"
  21. "e": "\u0435"
  22. # this conversion shouldn't be needed, but does no harm
  23. "Z": "\u0417"
  24. "z": "\u0437"
  # U+0306 is COMBINING BREVE: "I" + breve maps to U+0419 (capital short I).
  25. "I\u0306": "\u0419"
  # U+FE20 / U+FE21 are COMBINING LIGATURE LEFT HALF / RIGHT HALF; together they tie
  # the two Latin letters of a digraph. Both the all-caps and the title-case forms
  # map to the same capital letter (U+042E for IU/Iu, U+042F for IA/Ia).
  26. # this conversion shouldn't be needed, but does no harm
  27. "I\uFE20U\uFE21": "\u042E"
  28. # this conversion shouldn't be needed, but does no harm
  29. "I\uFE20u\uFE21": "\u042E"
  30. "I\uFE20A\uFE21": "\u042F"
  31. # this conversion shouldn't be needed, but does no harm
  32. "I\uFE20a\uFE21": "\u042F"
  33. "i\u0306": "\u0439"
  34. "i\uFE20u\uFE21": "\u044E"
  35. "i\uFE20a\uFE21": "\u044F"
  # Digraph "KH"/"Kh"/"kh" maps to U+0425 / U+0445; a lone "K"/"k" maps to
  # U+041A / U+043A.
  36. # this conversion shouldn't be needed, but does no harm
  37. "KH": "\u0425"
  38. "Kh": "\u0425"
  39. "K": "\u041A"
  40. "kh": "\u0445"
  41. "k": "\u043A"
  42. "L": "\u041B"
  43. "l": "\u043B"
  44. "M": "\u041C"
  45. "m": "\u043C"
  46. "N": "\u041D"
  47. "n": "\u043D"
  48. "O": "\u041E"
  49. "o": "\u043E"
  50. "P": "\u041F"
  51. "p": "\u043F"
  52. "R": "\u0420"
  53. "r": "\u0440"
  # NOTE(review): the next two comments are identical and adjacent, with no entry
  # between them; one of them likely annotated an entry that was removed - confirm.
  54. # this conversion shouldn't be needed, but does no harm
  55. # this conversion shouldn't be needed, but does no harm
  # Digraph "SH"/"Sh"/"sh" maps to U+0428 / U+0448; a lone "S"/"s" maps to
  # U+0421 / U+0441.
  56. "SH": "\u0428"
  57. "Sh": "\u0428"
  58. "S": "\u0421"
  59. "sh": "\u0448"
  60. "s": "\u0441"
  61. # this conversion shouldn't be needed, but does no harm
  62. "T": "\u0422"
  63. "t": "\u0442"
  64. "U": "\u0423"
  65. "u": "\u0443"
  66. "F": "\u0424"
  67. "f": "\u0444"
  # Digraph "CH"/"Ch"/"ch" maps to U+0427 / U+0447; this map has no entry for a
  # lone "C" or "c".
  68. # this conversion shouldn't be needed, but does no harm
  69. "CH": "\u0427"
  70. "Ch": "\u0427"
  71. "ch": "\u0447"
  # The two ligature half marks on their own map to an empty string.
  72. # this conversion shouldn't be needed, but does no harm
  73. "\uFE20": ""
  74. # this conversion shouldn't be needed, but does no harm
  75. "\uFE21": ""
  # U+02B9 is MODIFIER LETTER PRIME. It is mapped to the lowercase soft sign
  # (U+044C); the uppercase soft sign (U+042C) is never produced in this direction.
  76. # this conversion is ambiguous - \u042C is also theoretically possible
  77. "\u02B9": "\u044C"
  # Cyrillic -> Latin (romanized) direction. Every key under "map" is a single
  # Cyrillic code point; every value is the romanized string that replaces it.
  # Digraph romanizations carry the ligature half marks U+FE20 / U+FE21 over their
  # two letters, except Kh, Ch, Sh and Shch, which are written without them.
  78. script_to_roman:
  79. map:
  # U+0404 (capital Ukrainian IE) and U+0407 (capital YI, romanized as "I" plus
  # U+0308 COMBINING DIAERESIS) are listed in upper case only, and have no reverse
  # entry in roman_to_script.
  # NOTE(review): presumably child tables add the lowercase and reverse forms - confirm.
  80. "\u0404": "I\uFE20E\uFE21"
  81. "\u0407": "I\u0308"
  82. "\u0410": "A"
  83. "\u0411": "B"
  84. "\u0412": "V"
  85. "\u0414": "D"
  86. "\u0415": "E"
  87. "\u0417": "Z"
  88. "\u0419": "I\u0306"
  89. "\u041A": "K"
  90. "\u041B": "L"
  91. "\u041C": "M"
  92. "\u041D": "N"
  93. "\u041E": "O"
  94. "\u041F": "P"
  95. "\u0420": "R"
  96. "\u0421": "S"
  97. "\u0422": "T"
  98. "\u0423": "U"
  99. "\u0424": "F"
  100. "\u0425": "Kh"
  101. "\u0427": "Ch"
  102. "\u0428": "Sh"
  # U+0429 -> "Shch" (and U+0449 -> "shch" further down) has no matching "Shch"
  # key in roman_to_script.
  # NOTE(review): confirm whether the reverse entry is meant to be supplied by
  # child tables.
  103. "\u0429": "Shch"
  # Upper- and lowercase soft sign (U+042C here, U+044C further down) both
  # romanize to U+02B9 (MODIFIER LETTER PRIME), so letter case is not recoverable
  # from the romanized form.
  104. "\u042C": "\u02B9"
  105. "\u042E": "I\uFE20U\uFE21"
  106. "\u042F": "I\uFE20A\uFE21"
  # Lowercase letters follow, mirroring the uppercase entries above.
  107. "\u0430": "a"
  108. "\u0431": "b"
  109. "\u0432": "v"
  110. "\u0434": "d"
  111. "\u0435": "e"
  112. "\u0437": "z"
  113. "\u0439": "i\u0306"
  114. "\u043A": "k"
  115. "\u043B": "l"
  116. "\u043C": "m"
  117. "\u043D": "n"
  118. "\u043E": "o"
  119. "\u043F": "p"
  120. "\u0440": "r"
  121. "\u0441": "s"
  122. "\u0442": "t"
  123. "\u0443": "u"
  124. "\u0444": "f"
  125. "\u0445": "kh"
  126. "\u0447": "ch"
  127. "\u0448": "sh"
  128. "\u0449": "shch"
  129. "\u044C": "\u02B9"
  130. "\u044E": "i\uFE20u\uFE21"
  131. "\u044F": "i\uFE20a\uFE21"