ArmenianRomanization.cfg 8.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473
  1. # Original table by Randall K. Barry, 19 February 2021
  2. # Corrected 01 March 2021 to fix "E/e" problem and add five special ligatures
  3. # Corrected 18 April 2022 to fix "dz" problem
  4. # Corrected 18 April 2022 to fix "ev/Ev" problems
  5. # Corrected 25 April 2022 to add new "H/h+dot below" mappings
  6. # Corrected 25 April 2022 to add Armenian punctuation mappings
  7. # Corrected 28 April 2022 to add hyphen processing
  8. [General]
  9. Name=Armenian
  10. # UNICODE ARMENIAN CHARACTER RANGE: U+0530-U+058F
  11. [RomanToScript]
  12. FieldsIncluded=100 110 111 130 240 245 246 250 260 264 440 490 600 610 611 630 651 700 710 711 730 740 800 830
  13. SubfieldsAlwaysExcluded=uvxy0123456789
  14. OtherSubfieldsExcludedByTag=100/e 110/e 111/j 246/i 260/c 264/c 650/a 700/e 700/i 710/e 710/i 711/i 711/j 730/i
  15. # RDA boilerplate phrases not transliterated:
  16. Place of publication not identified=Place of publication not identified
  17. publisher not identified=publisher not identified
  18. date of publication not identified=date of publication not identified
  19. At head of title=At head of title
  20. Colophon=Colophon
  21. and others=and others
  22. and one other=and one other
  23. and two others=and two others
  24. and three others=and three others
  25. and four others=and four others
  26. and five others=and five others
  27. and six others=and six others
  28. and seven others=and seven others
  29. and eight others=and eight others
  30. and nine others=and nine others
  31. and ten others=and ten others
  32. and eleven others=and eleven others
  33. and twelve others=and twelve others
  34. and thirteen others=and thirteen others
  35. and fourteen others=and fourteen others
  36. and fifteen others=and fifteen others
  37. and sixteen others=and sixteen others
  38. and seventeen others=and seventeen others
  39. and eighteen others=and eighteen others
  40. and nineteen others=and nineteen others
  41. et al.=et al.
  42. XLIX=XLIX
  43. XLIV=XLIV
  44. XLIII=XLIII
  45. XLII=XLII
  46. XLI=XLI
  47. XLVIII=XLVIII
  48. XLVII=XLVII
  49. XLVI=XLVI
  50. XLV=XLV
  51. XL=XL
  52. LXXXIX=LXXXIX
  53. LXXXIV=LXXXIV
  54. LXXXIII=LXXXIII
  55. LXXXII=LXXXII
  56. LXXXI=LXXXI
  57. LXXXVIII=LXXXVIII
  58. LXXXVII=LXXXVII
  59. LXXXVI=LXXXVI
  60. LXXXV=LXXXV
  61. LXXX=LXXX
  62. LXXIX=LXXIX
  63. LXXIV=LXXIV
  64. LXXIII=LXXIII
  65. LXXII=LXXII
  66. LXXI=LXXI
  67. LXXVIII=LXXVIII
  68. LXXVII=LXXVII
  69. LXXVI=LXXVI
  70. LXXV=LXXV
  71. LXX=LXX
  72. LXIX=LXIX
  73. LXIV=LXIV
  74. LXIII=LXIII
  75. LXII=LXII
  76. LXI=LXI
  77. LXVIII=LXVIII
  78. LXVII=LXVII
  79. LXVI=LXVI
  80. LXV=LXV
  81. LX=LX
  82. LIX=LIX
  83. LIV=LIV
  84. LIII=LIII
  85. LII=LII
  86. LI=LI
  87. LVIII=LVIII
  88. LVII=LVII
  89. LVI=LVI
  90. LV=LV
  91. XXXIX=XXXIX
  92. XXXIV=XXXIV
  93. XXXIII=XXXIII
  94. XXXII=XXXII
  95. XXXI=XXXI
  96. XXXVIII=XXXVIII
  97. XXXVII=XXXVII
  98. XXXVI=XXXVI
  99. XXXV=XXXV
  100. XXX=XXX
  101. XXIX=XXIX
  102. XXIV=XXIV
  103. XXIII=XXIII
  104. XXII=XXII
  105. XXI=XXI
  106. XXVIII=XXVIII
  107. XXVII=XXVII
  108. XXVI=XXVI
  109. XXV=XXV
  110. XX=XX
  111. XIX=XIX
  112. XIV=XIV
  113. XIII=XIII
  114. XII=XII
  115. XI=XI
  116. XVIII=XVIII
  117. XVII=XVII
  118. XVI=XVI
  119. XV=XV
  120. IV=IV
  121. VIII=VIII
  122. VII=VII
  123. VI=VI
  124. IX=IX
  125. III=III
  126. II=II
  127. A=U+0531
  128. a=U+0561
  129. B=U+0532
  130. b=U+0562
  131. # GH combination
  132. GH=U+0542
  133. # Gh combination
  134. Gh=U+0542
  135. # gh combination
  136. gh=U+0572
  137. G=U+0533
  138. g=U+0563
  139. # DZ combination
  140. DZ=U+0541
  141. # Dz combination
  142. Dz=U+0541
  143. # dz combination
  144. dz=U+0571
  145. D=U+0534
  146. d=U+0564
  147. # ev combination (lowercase)
  148. ev=U+0587
  149. # EW combination
  150. EW=U+0535U+0582
  151. # Ew combination
  152. Ew=U+0535U+0582
  153. # ew combination
  154. ew=U+0565U+0582
  155. # E+prime+V combination
  156. EU+02B9V=U+0535U+054E
  157. # E+prime+v combination
  158. EU+02B9v=U+0535U+057E
  159. # E+apostrophe+V combination
  160. EU+0027V=U+0535U+054E
  161. # E+apostrophe+v combination
  162. EU+0027v=U+0535U+057E
  163. # EV combination
  164. EV=U+0535U+054E
  165. # Ev combination
  166. Ev=U+0535U+057E
  167. # E uppercase with macron
  168. EU+0304=U+0537
  169. # e lowercase with macron
  170. eU+0304=U+0567
  171. # E uppercase with caron
  172. EU+030C=U+0538
  173. # e lowercase with caron
  174. eU+030C=U+0568
  175. E=U+0535
  176. e=U+0565
  177. # T uppercase with ayn
  178. TU+02BB=U+0539
  179. # t lowercase with ayn
  180. tU+02BB=U+0569
  181. # ZH combination
  182. ZH=U+053A
  183. # Zh combination
  184. Zh=U+053A
  185. # zh combination
  186. zh=U+056A
  187. Z=U+0536
  188. z=U+0566
  189. I=U+053B
  190. i=U+056B
  191. L=U+053C
  192. l=U+056C
  193. # KH combination
  194. KH=U+053D
  195. # Kh combination
  196. Kh=U+053D
  197. # kh combination
  198. kh=U+056D
  199. # H uppercase with dot below
  200. HU+0323=U+0545
  201. # h lowercase with dot below
  202. hU+0323=U+0575
  203. # TS + ayn combination
  204. TSU+02BB=U+0551
  205. # Ts + ayn combination
  206. TsU+02BB=U+0551
  207. # ts + ayn combination
  208. tsU+02BB=U+0581
  209. # TS combination
  210. TS=U+053E
  211. # Ts combination
  212. Ts=U+053E
  213. # ts combination
  214. ts=U+056E
  215. # K + ayn
  216. KU+02BB=U+0554
  217. # k + ayn
  218. kU+02BB=U+0584
  219. K=U+053F
  220. k=U+056F
  221. # CH + ayn combination
  222. CHU+02BB=U+0549
  223. # Ch + ayn combination
  224. ChU+02BB=U+0549
  225. # ch + ayn combination
  226. chU+02BB=U+0579
  227. # CH combination
  228. CH=U+0543
  229. # Ch combination
  230. Ch=U+0543
  231. # ch combination
  232. ch=U+0573
  233. M=U+0544
  234. m=U+0574
  235. Y=U+0545
  236. y=U+0575
  237. N=U+0546
  238. n=U+0576
  239. # SH combination
  240. SH=U+0547
  241. # Sh combination
  242. Sh=U+0547
  243. # sh combination
  244. sh=U+0577
  245. H=U+0540
  246. h=U+0570
  247. # O uppercase with combining macron
  248. OU+0304=U+0555
  249. # o lowercase with combining macron
  250. oU+0304=U+0585
  251. O=U+0548
  252. o=U+0578
  253. # P uppercase + ayn
  254. PU+02BB=U+0553
  255. # p lowercase + ayn
  256. pU+02BB=U+0583
  257. J=U+054B
  258. j=U+057B
  259. # R uppercase with combining dot below
  260. RU+0323=U+054C
  261. # r lowercase with combining dot below
  262. rU+0323=U+057C
  263. S=U+054D
  264. P=U+054A
  265. p=U+057A
  266. s=U+057D
  267. V=U+054E
  268. v=U+057E
  269. T=U+054F
  270. t=U+057F
  271. R=U+0550
  272. r=U+0580
  273. W=U+0552
  274. w=U+0582
  275. U=U+0548U+0582
  276. u=U+0578U+0582
  277. F=U+0556
  278. f=U+0586
  279. U+0020U+0022=U+0020U+00AB
  280. U+0022U+0020=U+00BBU+0020
  281. U+02B9=
  282. # Armenian exclamation mark
  283. U+0021=U+055C
  284. # Armenian question mark
  285. U+003F=U+055E
  286. # Armenian comma
  287. U+002C=U+055D
  288. # Armenian period
  289. U+002E=U+0589
  290. # Armenian hyphen
  291. U+002D=U+058A
  292. # Armenian apostrophe
  293. U+0027=U+055A
  294. [ScriptToRoman]
  295. FieldsIncluded=100 110 111 130 240 245 246 250 260 264 440 490 600 610 611 630 651 700 710 711 730 740 800 830
  296. SubfieldsAlwaysExcluded=uvxy0123456789
  297. OtherSubfieldsExcludedByTag=100/e 110/e 111/j 246/i 260/c 264/c 650/a 700/e 700/i 710/e 710/i 711/i 711/j 730/i
  298. # RDA boilerplate phrases not transliterated:
  299. Place of publication not identified=Place of publication not identified
  300. publisher not identified=publisher not identified
  301. U+053FU+0540=KU+02B9H
  302. U+053FU+0570=KU+02B9h
  303. U+056FU+0570=kU+02B9h
  304. U+0536U+0540=ZU+02B9H
  305. U+0536U+0570=ZU+02B9h
  306. U+0566U+0570=zU+02B9h
  307. U+054FU+054D=TU+02B9S
  308. U+054FU+057D=TU+02B9s
  309. U+057FU+057D=tU+02B9s
  310. U+0534U+0536=DU+02B9Z
  311. U+0534U+0566=DU+02B9z
  312. U+0564U+0566=dU+02B9z
  313. U+0533U+0540=GU+02B9H
  314. U+0533U+0570=GU+02B9h
  315. U+0563U+0570=gU+02B9h
  316. U+054DU+0540=SU+02B9H
  317. U+054DU+0570=SU+02B9h
  318. U+057DU+0570=sU+02B9h
  319. U+0531=A
  320. U+0561=a
  321. U+0532=B
  322. U+0562=b
  323. # Gh combination
  324. U+0542=Gh
  325. # gh combination
  326. U+0572=gh
  327. U+0533=G
  328. U+0563=g
  329. # Dz combination
  330. U+0541=Dz
  331. # dz combination
  332. U+0571=dz
  333. U+0534=D
  334. U+0564=d
  335. U+0548U+0582=U
  336. U+0578U+0582=u
  337. # EV combination
  338. U+0537U+054E=EU+02B9V
  339. # Ev combination
  340. U+0537U+057E=EU+02B9v
  341. # ev combination
  342. U+0567U+057E=eU+02B9v
  343. # E uppercase with macron
  344. U+0537=EU+0304
  345. # e lowercase with macron
  346. U+0567=eU+0304
  347. # E uppercase with caron
  348. U+0538=EU+030C
  349. # e lowercase with caron
  350. U+0568=eU+030C
  351. # Ew combination
  352. U+0535U+0582=Ew
  353. # ew combination
  354. U+0565U+0582=ew
  355. # Ev combination
  356. U+0535U+057E=Ev
  357. # ev combination
  358. U+0565U+057E=ev
  359. U+0535=E
  360. U+0565=e
  361. # T uppercase with ayn
  362. U+0539=TU+02BB
  363. # t lowercase with ayn
  364. U+0569=tU+02BB
  365. # Zh combination
  366. U+053A=Zh
  367. # zh combination
  368. U+056A=zh
  369. U+0536=Z
  370. U+0566=z
  371. U+053B=I
  372. U+056B=i
  373. U+053C=L
  374. U+056C=l
  375. # Kh combination
  376. U+053D=Kh
  377. # kh combination
  378. U+056D=kh
  379. # Ts + ayn combination
  380. U+0551=TsU+02BB
  381. # ts + ayn combination
  382. U+0581=tsU+02BB
  383. # Ts combination
  384. U+053E=Ts
  385. # ts combination
  386. U+056E=ts
  387. # K + ayn
  388. U+0554=KU+02BB
  389. # k + ayn
  390. U+0584=kU+02BB
  391. U+053F=K
  392. U+056F=k
  393. # Ch + ayn combination
  394. U+0549=ChU+02BB
  395. # ch + ayn combination
  396. U+0579=chU+02BB
  397. # Ch combination
  398. U+0543=Ch
  399. # ch combination
  400. U+0573=ch
  401. U+0544=M
  402. U+0574=m
  403. # Word-initial uppercase H+dot below
  404. U+0020U+0545=U+0020HU+0323
  405. # Word-initial lowercase h+dot below
  406. U+0020U+0575=U+0020hU+0323
  407. # Word-initial hyphenated uppercase H+dot below
  408. U+002DU+0545=U+002DHU+0323
  409. # Word-initial hyphenated lowercase h+dot below
  410. U+002DU+0575=U+002DhU+0323
  411. U+0545=Y
  412. U+0575=y
  413. U+0546=N
  414. U+0576=n
  415. # Sh combination
  416. U+0547=Sh
  417. # sh combination
  418. U+0577=sh
  419. U+0540=H
  420. U+0570=h
  421. # O uppercase with combining macron
  422. U+0555=OU+0304
  423. # o lowercase with combining macron
  424. U+0585=oU+0304
  425. U+0548=O
  426. U+0578=o
  427. # P uppercase + ayn
  428. U+0553=PU+02BB
  429. # p lowercase + ayn
  430. U+0583=pU+02BB
  431. U+054B=J
  432. U+057B=j
  433. # R uppercase with combining dot below
  434. U+054C=RU+0323
  435. # r lowercase with combining dot below
  436. U+057C=rU+0323
  437. U+054A=P
  438. U+057A=p
  439. U+054D=S
  440. U+057D=s
  441. U+054E=V
  442. U+057E=v
  443. U+054F=T
  444. U+057F=t
  445. U+0550=R
  446. U+0580=r
  447. U+0552=W
  448. U+0582=w
  449. U+0556=F
  450. U+0586=f
  451. U+0587=ev
  452. U+0588=yi
  453. U+FB13=mn
  454. U+FB14=me
  455. U+FB15=mi
  456. U+FB16=vn
  457. U+FB17=mkh
  458. U+055B=
  459. U+055C=!
  460. U+055D=,
  461. U+055E=?
  462. U+0589=.
  463. U+058A=-
  464. U+00AB="
  465. U+00BB="