MongolianRomanization.cfg 7.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375
  1. # Original table by Randall K. Barry, 14 February 2021
  2. # Revised by Randall K. Barry to correct "ng" conversion, 10 August 2021
  3. # Revised by Randall K. Barry to correct "e+dot" conversion, 18 August 2021
  4. # Revised by Randall K. Barry to correct "-e" (non-joining "e") conversion, 19 November 2021
  5. # Revised by Randall K. Barry to add roman numeral handling, 13 May 2022
  6. [General]
  7. Name=Mongolian
  8. # UNICODE MONGOLIAN CHARACTER RANGE: U+1800-U+18AF
  9. [RomanToScript]
  10. FieldsIncluded=100 110 111 130 240 245 246 250 260 264 440 490 600 610 611 630 651 700 710 711 730 740 800 830
  11. SubfieldsAlwaysExcluded=uvxy0123456789
  12. OtherSubfieldsExcludedByTag=100/e 110/e 111/j 246/i 260/c 264/c 650/a 700/e 700/i 710/e 710/i 711/i 711/j 730/i
  13. # RDA boilerplate phrases not transliterated:
  14. Place of publication not identified=Place of publication not identified
  15. publisher not identified=publisher not identified
  16. date of publication not identified=date of publication not identified
  17. At head of title=At head of title
  18. Colophon=Colophon
  19. and others=and others
  20. and one other=and one other
  21. and two others=and two others
  22. and three others=and three others
  23. and four others=and four others
  24. and five others=and five others
  25. and six others=and six others
  26. and seven others=and seven others
  27. and eight others=and eight others
  28. and nine others=and nine others
  29. and ten others=and ten others
  30. and eleven others=and eleven others
  31. and twelve others=and twelve others
  32. and thirteen others=and thirteen others
  33. and fourteen others=and fourteen others
  34. and fifteen others=and fifteen others
  35. and sixteen others=and sixteen others
  36. and seventeen others=and seventeen others
  37. and eighteen others=and eighteen others
  38. and nineteen others=and nineteen others
  39. et al.=et al.
  40. XLIX=XLIX
  41. XLIV=XLIV
  42. XLIII=XLIII
  43. XLII=XLII
  44. XLI=XLI
  45. XLVIII=XLVIII
  46. XLVII=XLVII
  47. XLVI=XLVI
  48. XLV=XLV
  49. XL=XL
  50. LXXXIX=LXXXIX
  51. LXXXIV=LXXXIV
  52. LXXXIII=LXXXIII
  53. LXXXII=LXXXII
  54. LXXXI=LXXXI
  55. LXXXVIII=LXXXVIII
  56. LXXXVII=LXXXVII
  57. LXXXVI=LXXXVI
  58. LXXXV=LXXXV
  59. LXXX=LXXX
  60. LXXIX=LXXIX
  61. LXXIV=LXXIV
  62. LXXIII=LXXIII
  63. LXXII=LXXII
  64. LXXI=LXXI
  65. LXXVIII=LXXVIII
  66. LXXVII=LXXVII
  67. LXXVI=LXXVI
  68. LXXV=LXXV
  69. LXX=LXX
  70. LXIX=LXIX
  71. LXIV=LXIV
  72. LXIII=LXIII
  73. LXII=LXII
  74. LXI=LXI
  75. LXVIII=LXVIII
  76. LXVII=LXVII
  77. LXVI=LXVI
  78. LXV=LXV
  79. LX=LX
  80. LIX=LIX
  81. LIV=LIV
  82. LIII=LIII
  83. LII=LII
  84. LI=LI
  85. LVIII=LVIII
  86. LVII=LVII
  87. LVI=LVI
  88. LV=LV
  89. XXXIX=XXXIX
  90. XXXIV=XXXIV
  91. XXXIII=XXXIII
  92. XXXII=XXXII
  93. XXXI=XXXI
  94. XXXVIII=XXXVIII
  95. XXXVII=XXXVII
  96. XXXVI=XXXVI
  97. XXXV=XXXV
  98. XXX=XXX
  99. XXIX=XXIX
  100. XXIV=XXIV
  101. XXIII=XXIII
  102. XXII=XXII
  103. XXI=XXI
  104. XXVIII=XXVIII
  105. XXVII=XXVII
  106. XXVI=XXVI
  107. XXV=XXV
  108. XX=XX
  109. XIX=XIX
  110. XIV=XIV
  111. XIII=XIII
  112. XII=XII
  113. XI=XI
  114. XVIII=XVIII
  115. XVII=XVII
  116. XVI=XVI
  117. XV=XV
  118. IV=IV
  119. VIII=VIII
  120. VII=VII
  121. VI=VI
  122. IX=IX
  123. III=III
  124. II=II
  125. # COMMON COMBINING AND SPECIAL CHARACTERS USED WITH MONGOLIAN SCRIPT:
  126. # hyphen (spacing) U+002D
  127. # combining acute U+0301
  128. # combining dot above U+0307
  129. # combining tilde U+0303
  130. # combining macron U+0304
  131. # combining dot below U+0323
  132. # combining ring below U+0325
  133. # Mongolian vowel separator (spacing) U+180E
  134. # narrow no-break space U+202F
  135. U+002DA=U+180EU+1820
  136. U+002Da=U+180EU+1820
  137. A=U+1820
  138. a=U+1820
  139. U+002DE=U+180EU+1821
  140. U+002De=U+180EU+1821
  141. U+002D=U+202F
  142. EU+0307=U+1827
  143. eU+0307=U+1827
  144. E=U+1821
  145. e=U+1821
  146. I=U+1822
  147. i=U+1822
  148. OU+0307=U+1825
  149. oU+0307=U+1825
  150. O=U+1823
  151. o=U+1823
  152. UU+0307=U+1826
  153. uU+0307=U+1826
  154. U=U+1824
  155. u=U+1824
  156. NG=U+1829
  157. # this conversion shouldn't be needed, but does no harm
  158. nG=U+1829
  159. ng=U+1829
  160. N=U+1828
  161. n=U+1828
  162. B=U+182A
  163. b=U+182A
  164. P=U+182B
  165. p=U+182B
  166. Q=U+182C
  167. q=U+182C
  168. KH=U+183B
  169. Kh=U+183B
  170. # this conversion shouldn't be needed, but does no harm
  171. kH=U+183B
  172. kh=U+183B
  173. KU+0307=U+183A
  174. kU+0307=U+183A
  175. K=U+182C
  176. k=U+182C
  177. GU+0307=U+182D
  178. gU+0307=U+182D
  179. G=U+182D
  180. g=U+182D
  181. M=U+182E
  182. m=U+182E
  183. LH=U+1840
  184. Lh=U+1840
  185. # this conversion shouldn't be needed, but does no harm
  186. lH=U+1840
  187. lh=U+1840
  188. L=U+182F
  189. l=U+182F
  190. TSU+0307=U+183C
  191. # this conversion shouldn't be needed, but does no harm
  192. TsU+0307=U+183C
  193. # this conversion shouldn't be needed, but does no harm
  194. tSU+0307=U+183C
  195. tsU+0307=U+183C
  196. SU+0301=U+1831
  197. sU+0301=U+1831
  198. S=U+1830
  199. s=U+1830
  200. T=U+1832
  201. t=U+1832
  202. D=U+1833
  203. d=U+1833
  204. C=U+1834
  205. c=U+1834
  206. J=U+1835
  207. j=U+1835
  208. Y=U+1836
  209. y=U+1836
  210. R=U+1837
  211. r=U+1837
  212. V=U+1838
  213. v=U+1838
  214. W=U+1838
  215. w=U+1838
  216. F=U+1839
  217. f=U+1839
  218. ZR=U+183F
  219. # this conversion shouldn't be needed, but does no harm
  220. Zr=U+183F
  221. # this conversion shouldn't be needed, but does no harm
  222. zR=U+183F
  223. zr=U+183F
  224. ZH=U+1841
  225. Zh=U+1841
  226. # this conversion shouldn't be needed, but does no harm
  227. zH=U+1841
  228. zh=U+1841
  229. CH=U+1842
  230. Ch=U+1842
  231. # this conversion shouldn't be needed, but does no harm
  232. cH=U+1842
  233. ch=U+1842
  234. H=U+183E
  235. h=U+183E
  236. -=U+180E
  237. [ScriptToRoman]
  238. FieldsIncluded=100 110 111 130 240 245 246 250 260 264 440 490 600 610 611 630 651 700 710 711 730 740 800 830
  239. SubfieldsAlwaysExcluded=uvxy0123456789
  240. OtherSubfieldsExcludedByTag=100/e 110/e 111/j 246/i 260/c 264/c 650/a 700/e 700/i 710/e 710/i 711/i 711/j 730/i
  241. # RDA boilerplate phrases not transliterated:
  242. Place of publication not identified=Place of publication not identified
  243. publisher not identified=publisher not identified
  244. date of publication not identified=date of publication not identified
  245. At head of title=At head of title
  246. # g followed by vowel a
  247. U+182DU+1820=gU+0307a
  248. # g followed by vowel o
  249. U+182DU+1823=gU+0307o
  250. # g followed by vowel u
  251. U+182DU+1824=gU+0307u
  252. # g preceded by vowel a
  253. U+1820U+182D=agU+0307
  254. # g preceded by vowel o
  255. U+1823U+182D=ogU+0307
  256. # g preceded by vowel u
  257. U+1824U+182D=ugU+0307
  258. # g followed by vowel e
  259. U+182DU+1821=ge
  260. # g followed by vowel i
  261. U+182DU+1822=gi
  262. # g followed by vowel oe
  263. U+182DU+1825=goU+0307
  264. # g followed by vowel ue
  265. U+182DU+1826=guU+0307
  266. # g followed by vowel ee
  267. U+182DU+1827=geU+0307
  268. # g preceded by vowel e
  269. U+1821U+182D=eg
  270. # g preceded by vowel i
  271. U+1822U+182D=ig
  272. # g preceded by vowel oe
  273. U+1825U+182D=oU+0307g
  274. # g preceded by vowel ue
  275. U+1826U+182D=uU+0307g
  276. # g preceded by vowel ee
  277. U+1827U+182D=eU+0307g
  278. # q followed by vowel a
  279. U+182CU+1820=qU+0307a
  280. # q followed by vowel o
  281. U+182CU+1823=qU+0307o
  282. # q followed by vowel u
  283. U+182CU+1824=qU+0307u
  284. # q preceded by vowel a (should not occur)
  285. U+1820U+182C=qU+0307a
  286. # q preceded by vowel o (should not occur)
  287. U+1823U+182C=qU+0307o
  288. # q preceded by vowel u (should not occur)
  289. U+1824U+182C=qU+0307u
  290. # k followed by vowel e
  291. U+182CU+1821=ke
  292. # k followed by vowel i
  293. U+182CU+1822=ki
  294. # k followed by vowel oe
  295. U+182CU+1825=koU+0307
  296. # k followed by vowel ue
  297. U+182CU+1826=kuU+0307
  298. # k followed by vowel ee
  299. U+182CU+1827=keU+0307
  300. # k preceded by vowel e (should not occur)
  301. U+1821U+182C=ke
  302. # k preceded by vowel i (should not occur)
  303. U+1822U+182C=ki
  304. # k preceded by vowel oe (should not occur)
  305. U+1825U+182C=koU+0307
  306. # k preceded by vowel ue (should not occur)
  307. U+1826U+182C=kuU+0307
  308. # k preceded by vowel ee (should not occur)
  309. U+1827U+182C=keU+0307
  310. # non-connecting vowel a
  311. U+180EU+1820=U+002Da
  312. # non-connecting vowel e
  313. U+180EU+1821=U+002De
  314. # Other Mongolian vowel separators to hyphen
  315. U+180E=U+002D
  316. # Narrow no-break space to hyphen
  317. U+202F=U+002D
  318. # Other Mongolian vowels NOT associated with g or k/q
  319. U+1820=a
  320. U+1823=o
  321. U+1824=u
  322. U+1821=e
  323. U+1822=i
  324. U+1825=oU+0307
  325. U+1823=o
  326. U+1824=u
  327. U+1826=uU+0307
  328. U+1827=eU+0307
  329. U+1829=ng
  330. U+1828=n
  331. U+182A=b
  332. U+182B=p
  333. U+182C=q
  334. U+183B=kh
  335. U+183A=kU+0307
  336. U+182C=k
  337. U+182D=gU+0307
  338. U+182E=m
  339. U+1840=lh
  340. U+182F=l
  341. U+183C=tsU+0307
  342. U+1831=sU+0301
  343. U+1830=s
  344. U+1832=t
  345. U+1833=d
  346. U+1834=c
  347. U+1835=j
  348. U+1836=y
  349. U+1837=r
  350. U+1838=v
  351. U+1839=f
  352. U+183F=zr
  353. U+1841=zh
  354. U+1842=ch
  355. U+183E=hU+0307