KyrgyzRomanization.cfg 5.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297
  1. # Original table by Randall K. Barry, 08 March 2021
  2. [General]
  3. Name=Kyrgyz
  4. # UNICODE CYRILLIC CHARACTER RANGE: U+0400-U+052F
  5. # This configuration file maps all valid Unicode characters used in the Kyrgyz
  6. # and Russian languages as written in the Cyrillic script.
  7. [RomanToScript]
  8. FieldsIncluded=100 110 111 130 240 245 246 250 260 264 440 490 600 610 611 630 651 700
  9. 710 711 730 740 800 830
  10. SubfieldsAlwaysExcluded=uvxy0123456789
  11. OtherSubfieldsExcludedByTag=100/e 110/e 111/j 246/i 260/c 264/c 650/a 700/e 700/i 710/e
  12. 710/i 711/i 711/j 730/i
  13. # RDA boilerplate phrases and Roman numerals not transliterated:
  14. Place of publication not identified=Place of publication not identified
  15. publisher not identified=publisher not identified
  16. date of publication not identified=date of publication not identified
  17. At head of title=At head of title
  18. Colophon=Colophon
  19. III=III
  20. IV=IV
  21. VII=VII
  22. VIII=VIII
  23. IX=IX
  24. X=X
  25. XI=XI
  26. XII=XII
  27. XIV=XIV
  28. XV=XV
  29. XVI=XVI
  30. XVII=XVII
  31. XX=XX
  32. XXI=XXI
  33. XXII=XXII
  34. XXIV=XXIV
  35. XXV=XXV
  36. XXVI=XXVI
  37. XXVII=XXVII
  38. XXIX=XXIX
  39. XXX=XXX
  40. XXXI=XXXI
  41. XXXII=XXXII
  42. XXXIV=XXXIV
  43. XXXV=XXXV
  44. XXXVI=XXXVI
  45. XXXVII=XXXVII
  46. XL=XL
  47. LX=LX
  48. LXX=LXX
  49. LXXX=LXXX
  50. # COMMON COMBINING CHARACTERS (always follow a base letter):
  51. # combining grave U+0300
  52. # combining acute U+0301
  53. # combining circumflex U+0302
  54. # combining macron U+0304
  55. # combining breve U+0306
  56. # combining dot above U+0307
  57. # combining diaeresis U+0308
  58. # combining caron (hachek) U+030C
  59. # combining candrabindu U+0310
  60. # combining dot below U+0323
  61. # combining comma below U+0326 (Romanian, Latvian, Livonian)
  62. # combining cedilla U+0327 (French, Turkish, Azeri)
  63. # combining ogonek (hook) U+0328 (Polish, Lithuanian)
  64. # combining left ligature U+FE20 (Cyrillic transliteration)
  65. # combining right ligature U+FE21 (Cyrillic transliteration)
  66. # soft sign/prime (spacing) U+02B9 (Cyrillic transliteration)
  67. # hard sign/double prime (spacing) U+02BA (Cyrillic transliteration)
  68. AU+0306=U+04D8
  69. aU+0306=U+04D9
  70. A=U+0410
  71. a=U+0430
  72. B=U+0411
  73. b=U+0431
  74. V=U+0412
  75. v=U+0432
  76. Gh=U+0492
  77. gh=U+0493
  78. GU+0307=U+049C
  79. gU+0307=U+049D
  80. NU+FE20GU+FE21=U+04A2
  81. nU+FE20gU+FE21=U+04A3
  82. G=U+0413
  83. g=U+0433
  84. D=U+0414
  85. d=U+0434
  86. EU+0307=U+042D
  87. EU+0308=U+0401
  88. EU+0328=U+0466
  89. E=U+0415
  90. eU+0307=U+044D
  91. eU+0308=U+0451
  92. eU+0328=U+0467
  93. e=U+0435
  94. ZH=U+0416
  95. Zh=U+0416
  96. Z=U+0417
  97. zh=U+0436
  98. z=U+0437
  99. IU+0304=U+0406
  100. IU+0306=U+0419
  101. IU+0310=U+0408
  102. IU+FE20EU+FE21=U+0462
  103. IU+FE20eU+FE21=U+0462
  104. IU+FE20UU+FE21=U+042E
  105. IU+FE20uU+FE21=U+042E
  106. IU+FE20AU+FE21=U+042F
  107. IU+FE20aU+FE21=U+042F
  108. I=U+0418
  109. iU+0304=U+0456
  110. iU+0306=U+0439
  111. iU+0310=U+0458
  112. iU+FE20eU+FE21=U+0463
  113. iU+FE20uU+FE21=U+044E
  114. iU+FE20aU+FE21=U+044F
  115. i=U+0438
  116. J=U+04B8
  117. j=U+04B9
  118. KH=U+0425
  119. Kh=U+0425
  120. K=U+041A
  121. kh=U+0445
  122. k=U+043A
  123. L=U+041B
  124. l=U+043B
  125. M=U+041C
  126. m=U+043C
  127. N=U+041D
  128. n=U+043D
  129. OU+0307=U+04E8
  130. O=U+041E
  131. oU+0307=U+04E9
  132. o=U+043E
  133. P=U+041F
  134. p=U+043F
  135. Q=U+049A
  136. q=U+049B
  137. R=U+0420
  138. r=U+0440
  139. SHCH=U+0429
  140. Shch=U+0429
  141. SH=U+0428
  142. Sh=U+0428
  143. S=U+0421
  144. shch=U+0449
  145. sh=U+0448
  146. s=U+0441
  147. TU+FE20SU+FE21=U+0426
  148. TU+FE20sU+FE21=U+0426
  149. T=U+0422
  150. tU+FE20sU+FE21=U+0446
  151. t=U+0442
  152. UU+0304=U+04B0
  153. uU+0304=U+04B1
  154. UU+0307=U+04AE
  155. uU+0307=U+04AF
  156. U=U+0423
  157. u=U+0443
  158. FU+0307=U+0472
  159. F=U+0424
  160. fU+0307=U+0473
  161. f=U+0444
  162. CH=U+0427
  163. Ch=U+0427
  164. ch=U+0447
  165. HU+0307=U+04BA
  166. hU+0307=U+04BB
  167. YU+0307=U+0474
  168. Y=U+042B
  169. yU+0307=U+0475
  170. y=U+044B
  171. # maps a stray combining left ligature (U+FE20) to nothing; this conversion shouldn't be needed, but does no harm
  172. U+FE20=
  173. # maps a stray combining right ligature (U+FE21) to nothing; this conversion shouldn't be needed, but does no harm
  174. U+FE21=
  175. # this conversion is ambiguous - U+042C is also theoretically possible
  176. U+0027=U+044C
  177. # this conversion is ambiguous - U+042C is also theoretically possible
  178. U+02B9=U+044C
  179. # this conversion is ambiguous - U+042A is also theoretically possible
  180. U+02BA=U+044A
  181. [ScriptToRoman]
  182. FieldsIncluded=100 110 111 130 240 245 246 250 260 264 440 490 600 610 611 630 651 700 710 711 730 740 800 830
  183. SubfieldsAlwaysExcluded=uvxy0123456789
  184. OtherSubfieldsExcludedByTag=100/e 110/e 111/j 246/i 260/c 264/c 650/a 700/e 700/i 710/e 710/i 711/i 711/j 730/i
  185. # RDA boilerplate phrases not transliterated:
  186. Place of publication not identified=Place of publication not identified
  187. publisher not identified=publisher not identified
  188. U+0401=EU+0308
  189. U+0406=IU+0304
  190. U+0408=IU+0310
  191. U+0410=A
  192. U+0411=B
  193. U+0412=V
  194. U+0413=G
  195. U+0414=D
  196. U+0415=E
  197. U+0416=Zh
  198. U+0417=Z
  199. U+0418=I
  200. U+0419=IU+0306
  201. U+041A=K
  202. U+041B=L
  203. U+041C=M
  204. U+041D=N
  205. U+041E=O
  206. U+041F=P
  207. U+0420=R
  208. U+0421=S
  209. U+0422=T
  210. U+0423=U
  211. U+0424=F
  212. U+0425=Kh
  213. U+0426=TU+FE20SU+FE21
  214. U+0427=Ch
  215. U+0428=Sh
  216. U+0429=Shch
  217. U+042A=U+02BA
  218. U+042B=Y
  219. U+042C=U+02B9
  220. U+042D=EU+0307
  221. U+042E=IU+FE20UU+FE21
  222. U+042F=IU+FE20AU+FE21
  223. U+0430=a
  224. U+0431=b
  225. U+0432=v
  226. U+0433=g
  227. U+0434=d
  228. U+0435=e
  229. U+0436=zh
  230. U+0437=z
  231. U+0438=i
  232. U+0439=iU+0306
  233. U+043A=k
  234. U+043B=l
  235. U+043C=m
  236. U+043D=n
  237. U+043E=o
  238. U+043F=p
  239. U+0440=r
  240. U+0441=s
  241. U+0442=t
  242. U+0443=u
  243. U+0444=f
  244. U+0445=kh
  245. U+0446=tU+FE20sU+FE21
  246. U+0447=ch
  247. U+0448=sh
  248. U+0449=shch
  249. U+044A=U+02BA
  250. U+044B=y
  251. U+044C=U+02B9
  252. U+044D=eU+0307
  253. U+044E=iU+FE20uU+FE21
  254. U+044F=iU+FE20aU+FE21
  255. U+0451=eU+0308
  256. U+0456=iU+0304
  257. U+0458=iU+0310
  258. U+0462=IU+FE20EU+FE21
  259. U+0463=iU+FE20eU+FE21
  260. U+0466=EU+0328
  261. U+0467=eU+0328
  262. U+0472=FU+0307
  263. U+0473=fU+0307
  264. U+0474=YU+0307
  265. U+0475=yU+0307
  266. U+0492=Gh
  267. U+0493=gh
  268. U+049A=Q
  269. U+049B=q
  270. U+049C=GU+0307
  271. U+049D=gU+0307
  272. U+04A2=NU+FE20GU+FE21
  273. U+04A3=nU+FE20gU+FE21
  274. U+04AE=UU+0307
  275. U+04AF=uU+0307
  276. U+04B0=UU+0304
  277. U+04B1=uU+0304
  278. U+04B8=J
  279. U+04B9=j
  280. U+04BA=HU+0307
  281. U+04BB=hU+0307
  282. U+04D8=AU+0306
  283. U+04D9=aU+0306
  284. U+04E8=OU+0307
  285. U+04E9=oU+0307
  286.