RussianRomanization.cfg 7.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353
  1. # Original table by Gary L. Strawn
  2. # Updated by Hugh Taylor, 12 December 2006, 10.50 GMT
  3. # Added fields to FieldsIncluded 19 July 2007
  4. # Updated 30 May 2013 for RDA
  5. # Updated 15 Jan 2015 fixed incorrect i-kratkoe
  6. # Updated by Randall K. Barry, 14 February 2021, to add six Cyrillic characters used in Mongolian & Buriat
  7. # Updates by Randall K. Barry, 13 May 2022, to add Roman numeral conversion blocking
  8. [General]
  9. Name=Russian
  10. [RomanToScript]
  11. FieldsIncluded=100 110 111 130 240 245 246 250 260 264 440 490 600 610 611 630 651 700 710 711 730 740 800 830
  12. SubfieldsAlwaysExcluded=uvxy0123456789
  13. OtherSubfieldsExcludedByTag=100/e 110/e 111/j 246/i 260/c 264/c 650/a 700/e 700/i 710/e 710/i 711/i 711/j 730/i
  14. # RDA boilerplate phrases not transliterated:
  15. Place of publication not identified=Place of publication not identified
  16. publisher not identified=publisher not identified
  17. date of publication not identified=date of publication not identified
  18. At head of title=At head of title
  19. Colophon=Colophon
  20. and others=and others
  21. and one other=and one other
  22. and two others=and two others
  23. and three others=and three others
  24. and four others=and four others
  25. and five others=and five others
  26. and six others=and six others
  27. and seven others=and seven others
  28. and eight others=and eight others
  29. and nine others=and nine others
  30. and ten others=and ten others
  31. and eleven others=and eleven others
  32. and twelve others=and twelve others
  33. and thirteen others=and thirteen others
  34. and fourteen others=and fourteen others
  35. and fifteen others=and fifteen others
  36. and sixteen others=and sixteen others
  37. and seventeen others=and seventeen others
  38. and eighteen others=and eighteen others
  39. and nineteen others=and nineteen others
  40. et al.=et al.
  41. XLIX=XLIX
  42. XLIV=XLIV
  43. XLIII=XLIII
  44. XLII=XLII
  45. XLI=XLI
  46. XLVIII=XLVIII
  47. XLVII=XLVII
  48. XLVI=XLVI
  49. XLV=XLV
  50. XL=XL
  51. LXXXIX=LXXXIX
  52. LXXXIV=LXXXIV
  53. LXXXIII=LXXXIII
  54. LXXXII=LXXXII
  55. LXXXI=LXXXI
  56. LXXXVIII=LXXXVIII
  57. LXXXVII=LXXXVII
  58. LXXXVI=LXXXVI
  59. LXXXV=LXXXV
  60. LXXX=LXXX
  61. LXXIX=LXXIX
  62. LXXIV=LXXIV
  63. LXXIII=LXXIII
  64. LXXII=LXXII
  65. LXXI=LXXI
  66. LXXVIII=LXXVIII
  67. LXXVII=LXXVII
  68. LXXVI=LXXVI
  69. LXXV=LXXV
  70. LXX=LXX
  71. LXIX=LXIX
  72. LXIV=LXIV
  73. LXIII=LXIII
  74. LXII=LXII
  75. LXI=LXI
  76. LXVIII=LXVIII
  77. LXVII=LXVII
  78. LXVI=LXVI
  79. LXV=LXV
  80. LX=LX
  81. LIX=LIX
  82. LIV=LIV
  83. LIII=LIII
  84. LII=LII
  85. LI=LI
  86. LVIII=LVIII
  87. LVII=LVII
  88. LVI=LVI
  89. LV=LV
  90. XXXIX=XXXIX
  91. XXXIV=XXXIV
  92. XXXIII=XXXIII
  93. XXXII=XXXII
  94. XXXI=XXXI
  95. XXXVIII=XXXVIII
  96. XXXVII=XXXVII
  97. XXXVI=XXXVI
  98. XXXV=XXXV
  99. XXX=XXX
  100. XXIX=XXIX
  101. XXIV=XXIV
  102. XXIII=XXIII
  103. XXII=XXII
  104. XXI=XXI
  105. XXVIII=XXVIII
  106. XXVII=XXVII
  107. XXVI=XXVI
  108. XXV=XXV
  109. XX=XX
  110. XIX=XIX
  111. XIV=XIV
  112. XIII=XIII
  113. XII=XII
  114. XI=XI
  115. XVIII=XVIII
  116. XVII=XVII
  117. XVI=XVI
  118. XV=XV
  119. IV=IV
  120. VIII=VIII
  121. VII=VII
  122. VI=VI
  123. IX=IX
  124. III=III
  125. II=II
  126. # COMMON COMBINING CHARACTERS (always follow a base letter):
  127. # combining macron U+0304
  128. # combining breve U+0306
  129. # combining dot above U+0307
  130. # combining diaeresis U+0308
  131. # combining left ligature U+FE20 (Cyrillic transliteration)
  132. # combining right ligature U+FE21 (Cyrillic transliteration)
  133. # soft sign/prime (spacing) U+02B9 (Cyrillic transliteration)
  134. # hard sign/double prime (spacing) U+02BA (Cyrillic transliteration)
  135. A=U+0410
  136. a=U+0430
  137. B=U+0411
  138. b=U+0431
  139. V=U+0412
  140. v=U+0432
  141. G=U+0413
  142. g=U+0433
  143. D=U+0414
  144. d=U+0434
  145. EU+0307=U+042D
  146. EU+0308=U+0401
  147. # conversion results in a non-MARC-8 character
  148. EU+0328=U+0466
  149. E=U+0415
  150. eU+0307=U+044D
  151. eU+0308=U+0451
  152. # conversion results in a non-MARC-8 character
  153. eU+0328=U+0467
  154. e=U+0435
  155. # this conversion shouldn't be needed, but does no harm
  156. ZH=U+0416
  157. Zh=U+0416
  158. Z=U+0417
  159. zh=U+0436
  160. z=U+0437
  161. IU+0304=U+0406
  162. IU+0306=U+0419
  163. IU+FE20EU+FE21=U+0462
  164. # this conversion shouldn't be needed, but does no harm
  165. IU+FE20eU+FE21=U+0462
  166. IU+FE20UU+FE21=U+042E
  167. # this conversion shouldn't be needed, but does no harm
  168. IU+FE20uU+FE21=U+042E
  169. IU+FE20AU+FE21=U+042F
  170. # this conversion shouldn't be needed, but does no harm
  171. IU+FE20aU+FE21=U+042F
  172. I=U+0418
  173. iU+0304=U+0456
  174. iU+0306=U+0439
  175. iU+FE20eU+FE21=U+0463
  176. iU+FE20uU+FE21=U+044E
  177. iU+FE20aU+FE21=U+044F
  178. i=U+0438
  179. # this conversion shouldn't be needed, but does no harm
  180. KH=U+0425
  181. Kh=U+0425
  182. K=U+041A
  183. kh=U+0445
  184. k=U+043A
  185. L=U+041B
  186. l=U+043B
  187. M=U+041C
  188. m=U+043C
  189. N=U+041D
  190. n=U+043D
  191. # conversion results in a non-MARC-8 character
  192. OU+0307=U+04E8
  193. O=U+041E
  194. # conversion results in a non-MARC-8 character
  195. oU+0307=U+04E9
  196. o=U+043E
  197. P=U+041F
  198. p=U+043F
  199. R=U+0420
  200. r=U+0440
  201. # this conversion shouldn't be needed, but does no harm
  202. SHCH=U+0429
  203. Shch=U+0429
  204. # this conversion shouldn't be needed, but does no harm
  205. SH=U+0428
  206. Sh=U+0428
  207. S=U+0421
  208. shch=U+0449
  209. sh=U+0448
  210. s=U+0441
  211. TU+FE20SU+FE21=U+0426
  212. # this conversion shouldn't be needed, but does no harm
  213. TU+FE20sU+FE21=U+0426
  214. T=U+0422
  215. tU+FE20sU+FE21=U+0446
  216. t=U+0442
  217. # conversion results in a non-MARC-8 character
  218. UU+0307=U+04AE
  219. U=U+0423
  220. # conversion results in a non-MARC-8 character
  221. uU+0307=U+04AF
  222. u=U+0443
  223. FU+0307=U+0472
  224. F=U+0424
  225. fU+0307=U+0473
  226. f=U+0444
  227. # this conversion shouldn't be needed, but does no harm
  228. CH=U+0427
  229. Ch=U+0427
  230. ch=U+0447
  231. # conversion results in a non-MARC-8 character
  232. HU+0307=U+04BA
  233. # conversion results in a non-MARC-8 character
  234. hU+0307=U+04BB
  235. YU+0307=U+0474
  236. Y=U+042B
  237. yU+0307=U+0475
  238. y=U+044B
  239. # this conversion shouldn't be needed, but does no harm
  240. U+FE20=
  241. # this conversion shouldn't be needed, but does no harm
  242. U+FE21=
  243. # this conversion is ambiguous - U+042C is also theoretically possible
  244. U+0027=U+044C
  245. # this conversion is ambiguous - U+042C is also theoretically possible
  246. U+02B9=U+044C
  247. # this conversion is ambiguous - U+042A is also theoretically possible
  248. U+02BA=U+044A
  249. [ScriptToRoman]
  250. FieldsIncluded=100 110 111 130 240 245 246 250 260 264 440 490 600 610 611 630 651 700 710 711 730 740 800 830
  251. SubfieldsAlwaysExcluded=uvxy0123456789
  252. OtherSubfieldsExcludedByTag=100/e 110/e 111/j 246/i 260/c 264/c 650/a 700/e 700/i 710/e 710/i 711/i 711/j 730/i
  253. # RDA boilerplate phrases not transliterated:
  254. Place of publication not identified=Place of publication not identified
  255. publisher not identified=publisher not identified
  256. U+0401=EU+0308
  257. U+0451=eU+0308
  258. U+044C=U+02B9
  259. U+042C=U+02B9
  260. U+044A=U+02BA
  261. U+042A=U+02BA
  262. U+0410=A
  263. U+0430=a
  264. U+0411=B
  265. U+0431=b
  266. U+0412=V
  267. U+0432=v
  268. U+0413=G
  269. U+0433=g
  270. U+0414=D
  271. U+0434=d
  272. U+042D=EU+0307
  273. # this Unicode character shouldn't occur in MARC-8 data
  274. U+0466=EU+0328
  275. U+0415=E
  276. U+044D=eU+0307
  277. # this Unicode character shouldn't occur in MARC-8 data
  278. U+0467=eU+0328
  279. U+0435=e
  280. U+0416=Zh
  281. U+0417=Z
  282. U+0436=zh
  283. U+0437=z
  284. U+0406=IU+0304
  285. U+0419=IU+0306
  286. U+0462=IU+FE20EU+FE21
  287. U+042E=IU+FE20UU+FE21
  288. U+042F=IU+FE20AU+FE21
  289. U+0418=I
  290. U+0456=iU+0304
  291. U+0439=iU+0306
  292. U+0463=iU+FE20eU+FE21
  293. U+044E=iU+FE20uU+FE21
  294. U+044F=iU+FE20aU+FE21
  295. U+0438=i
  296. U+0425=Kh
  297. U+041A=K
  298. U+0445=kh
  299. U+043A=k
  300. U+041B=L
  301. U+043B=l
  302. U+041C=M
  303. U+043C=m
  304. U+041D=N
  305. U+043D=n
  306. # this Unicode character shouldn't occur in MARC-8 data
  307. U+04E8=OU+0307
  308. U+041E=O
  309. # this Unicode character shouldn't occur in MARC-8 data
  310. U+04E9=oU+0307
  311. U+043E=o
  312. U+041F=P
  313. U+043F=p
  314. U+0420=R
  315. U+0440=r
  316. U+0429=Shch
  317. U+0428=Sh
  318. U+0421=S
  319. U+0449=shch
  320. U+0448=sh
  321. U+0441=s
  322. U+0426=TU+FE20SU+FE21
  323. U+0422=T
  324. U+0446=tU+FE20sU+FE21
  325. U+0442=t
  326. # this Unicode character shouldn't occur in MARC-8 data
  327. U+04AE=UU+0307
  328. U+0423=U
  329. # this Unicode character shouldn't occur in MARC-8 data
  330. U+04AF=uU+0307
  331. U+0443=u
  332. U+0472=FU+0307
  333. U+0424=F
  334. U+0473=fU+0307
  335. U+0444=f
  336. U+0427=Ch
  337. # this Unicode character shouldn't occur in MARC-8 data
  338. U+04BA=HU+0307
  339. U+0447=ch
  340. # this Unicode character shouldn't occur in MARC-8 data
  341. U+04BB=hU+0307
  342. U+0474=YU+0307
  343. U+042B=Y
  344. U+0475=yU+0307
  345. U+044B=y