PushtoRomanization.cfg 6.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407
  1. # version 1.1
  2. # Original table by William Kopycki and Phong Tran
  3. # based on Persian revisions by Michael Chyet and Marzieh Rafi
  4. # Last updated 14 June 2013
  5. [General]
  6. Name=Pushto
  7. Truncation=%
  8. [RomanToScript]
  9. FieldsIncluded=100 110 111 130 245 246 250 260 264 440 490 505 600 610 611 630 651 700 710 711 730 740 800 830
  10. SubfieldsAlwaysExcluded=uvxy0123456789
  11. OtherSubfieldsExcludedByTag=100/e 110/e 111/j 246/i 260/c 264/c 650/a 700/e 700/i 710/e 710/i 711/i 711/j 730/i
  12. Subfield6Code=(3
  13. IncludeFormattingCharactersLcPattern=True
  14. # RDA boilerplate phrases not transliterated:
  15. Place of publication not identified=Place of publication not identified
  16. publisher not identified=publisher not identified
  17. # Punctuation marks:
  18. # %=U+066A ; cannot transliterate the truncation character
  19. *=U+066D
  20. ,=U+060C
  21. ;=U+061B
  22. ?=U+061F
  23. # Exceptions for specific words
  24. # Allah
  25. AllaU+0304h=U+0627U+0644U+0644U+0647
  26. # Qur'an
  27. QurU+02BCaU+0304n=U+0642U+0631U+0622U+0646
  28. # lillah
  29. lillaU+0304h=U+0644U+0644U+0647
  30. # billah
  31. billaU+0304h=U+0628U+0644U+0644U+0647
  32. # Rahman
  33. RahU+0323maU+0304n=U+0631U+062DU+0645U+0646
  34. # ta'lif (no exception rule follows this heading)
  35. # Ibn when it appears in the middle of a name sequence
  36. ibn=U+0628U+0646
  37. # Parsing "sh[dot below]" (s followed by h with dot below), as in "Ishaq [name]"
  38. %shU+0323%=U+0633U+062D
  39. # Edition statements with Latin number
  40. ChaU+0304p-i 1=U+0686U+0627U+067E 1
  41. ChaU+0304p-i 2=U+0686U+0627U+067E 2
  42. ChaU+0304p-i 3=U+0686U+0627U+067E 3
  43. ChaU+0304p-i 4=U+0686U+0627U+067E 4
  44. ChaU+0304p-i 5=U+0686U+0627U+067E 5
  45. ChaU+0304p-i 6=U+0686U+0627U+067E 6
  46. ChaU+0304p-i 7=U+0686U+0627U+067E 7
  47. ChaU+0304p-i 8=U+0686U+0627U+067E 8
  48. ChaU+0304p-i 9=U+0686U+0627U+067E 9
  49. # Numbers (Extended Arabic U+06F0-06F9 for Persian)
  50. # currently *not* valid MARC21 characters
  51. # 0=U+06F0
  52. # 1=U+06F1
  53. # 2=U+06F2
  54. # 3=U+06F3
  55. # 4=U+06F4
  56. # 5=U+06F5
  57. # 6=U+06F6
  58. # 7=U+06F7
  59. # 8=U+06F8
  60. # 9=U+06F9
  61. # Use Basic Arabic U+0660-0669, instead:
  62. 0=U+0660
  63. 1=U+0661
  64. 2=U+0662
  65. 3=U+0663
  66. 4=U+0664
  67. 5=U+0665
  68. 6=U+0666
  69. 7=U+0667
  70. 8=U+0668
  71. 9=U+0669
  72. # prime (U+02B9) = ZWNJ (U+200C)
  73. U+02B9aU+0304=U+200CU+0622
  74. U+02B9a=U+200CU+0627
  75. %U+02B9iU+0304=U+200CU+0627U+0649
  76. U+02B9iU+0304=U+200CU+0627U+064A
  77. iU+0304U+02B9=U+0649U+200C
  78. aU+0323yU+02B9=U+06D3U+200C
  79. U+02B9=U+200C
  80. # Vowel and vowel/consonant combinations
  81. # and hyphenated suffixes:
  82. # izafah here
  83. %h-U+02BEi=U+06C0
  84. %h-U+02BCi=U+06C0
  85. %-U+02BEi=U+06C0
  86. %-U+02BCi=U+06C0
  87. %h-yi=U+0647U+200CU+0649
  88. %-yi=U+0649
  89. %yi=U+0649
  90. %U+02BEiU+0304=U+0649
  91. %U+02BCiU+0304=U+0649
  92. %iU+0304-i=U+0649
  93. %iU+0304=U+0649
  94. %aU+0323h=U+06C0
  95. %ayy-i=U+0649
  96. %aU+0304y=U+0627U+0649
  97. %aU+0301=U+0649U+0670
  98. %al-i=U+0644
  99. %-i=
  100. # Hyphenated prefixes:
  101. wa-=U+0648
  102. bi-=U+0628
  103. al-=U+0627U+0644
  104. lil-=U+0644U+0644
  105. li-=U+0644
  106. ka-=U+0643
  107. # Diphthongs here
  108. Ayy%=U+0627U+064A
  109. ayy%=U+0627U+064A
  110. %aU+0323y=U+06D3
  111. %ay=U+0649
  112. U+02BBAw=U+0639U+0648
  113. U+02BBaw=U+0639U+0648
  114. Aw=U+0627U+0648
  115. aw=U+0648
  116. # ayn combo
  117. %U+02BBaU+0304%=U+0639U+0627
  118. # alif combos
  119. # [final position]
  120. %aU+0304U+02BE=U+0627U+0621
  121. %aU+0304U+02BC=U+0627U+0621
  122. %aU+0304U+02BEiU+0304=U+0627U+0626U+0649
  123. %aU+0304U+02BCiU+0304=U+0627U+0626U+0649
  124. # [initial position]
  125. AU+0304U+02BEiU+0304%=U+0622U+0626U+064A
  126. AU+0304U+02BCiU+0304%=U+0622U+0626U+064A
  127. aU+0304U+02BEiU+0304%=U+0622U+0626U+064A
  128. aU+0304U+02BCiU+0304%=U+0622U+0626U+064A
  129. # [medial position]
  130. aU+0304U+02BEiU+0304=U+0627U+0626U+064A
  131. aU+0304U+02BCiU+0304=U+0627U+0626U+064A
  132. aU+0304U+02BEi=U+0627U+0626
  133. aU+0304U+02BCi=U+0627U+0626
  134. aU+02BEiU+0304=U+0626U+064A
  135. aU+02BCiU+0304=U+0626U+064A
  136. # a [macron] hamza followed by e
  137. aU+0304U+02BEe=U+0627U+0626U+064A
  138. aU+0304U+02BCe=U+0627U+0626U+064A
  139. # s[dot below]h
  140. SU+0323h=U+069A
  141. sU+0323hsU+0323h=U+069A
  142. sU+0323h=U+069A
  143. # A
  144. U+02BBAU+0304=U+0639U+0627
  145. U+02BBaU+0304=U+0639U+0627
  146. U+02BBA%=U+0639
  147. U+02BBa=U+0639
  148. AU+02BB=U+0623U+0639
  149. aU+02BB=U+0639
  150. aU+02BE=U+0623
  151. aU+02BC=U+0623
  152. U+02BEa=U+0623
  153. U+02BCa=U+0623
  154. aU+0304U+02BE=U+0621
  155. aU+0304U+02BC=U+0621
  156. AU+0304%=U+0622
  157. aU+0304%=U+0622
  158. AU+0304=U+0627
  159. aU+0304=U+0627
  160. AU+0301=U+0649
  161. aU+0301=U+0649
  162. ayy=U+064A
  163. # heh hamzah at end (U+06C0, same target as the earlier %aU+0323h rule)
  164. aU+0323h=U+06C0
  165. A%=U+0627
  166. a%=U+0627
  167. A=
  168. a=
  169. # E
  170. %e=U+06D0
  171. E%=U+0627U+064A
  172. e%=U+0627U+064A
  173. e=U+06D0
  174. # I
  175. IU+02BB%=U+0627U+0639
  176. iU+02BB%=U+0627U+0639
  177. iU+02BB=U+0639
  178. U+02BBI%=U+0639
  179. IU+02BE%=U+0627U+0626
  180. IU+02BC%=U+0627U+0626
  181. iU+02BE=U+0626
  182. iU+02BC=U+0626
  183. U+02BEi=U+0626
  184. U+02BCi=U+0626
  185. IU+0304%=U+0627U+064A
  186. iU+0304%=U+0627U+064A
  187. iU+0304y=U+064A
  188. iU+0304=U+064A
  189. I%=U+0627
  190. i%=U+0627
  191. I=
  192. i=
  193. # O
  194. o%=U+0627U+0648
  195. O%=U+0627U+0648
  196. o=U+0648
  197. # U
  198. # (u [macron] hamza combos)
  199. uU+0304U+02BE=U+0624
  200. uU+0304U+02BC=U+0624
  201. U+02BEuU+0304=U+0626U+0648
  202. U+02BCuU+0304=U+0626U+0648
  203. UU+02BE%=U+0627U+0624
  204. UU+02BC%=U+0627U+0624
  205. uU+02BE=U+0624
  206. uU+02BC=U+0624
  207. UU+0304w%=U+0627U+0648
  208. uU+0304w=U+0648
  209. UU+0304=U+0627U+0648
  210. uU+0304=U+0648
  211. U%=U+0627
  212. u%=U+0627
  213. U=
  214. u=
  215. # Consonants:
  216. B=U+0628
  217. bb=U+0628
  218. b=U+0628
  219. P=U+067E
  220. pp=U+067E
  221. p=U+067E
  222. TU+0324=U+0637
  223. tU+0324tU+0324=U+0637
  224. tU+0324=U+0637
  225. TU+0323=U+067C
  226. tU+0323tU+0323=U+067C
  227. tU+0323=U+067C
  228. T=U+062A
  229. tt=U+062A
  230. t=U+062A
  231. # s[dot below]h rules used to be here; they now appear earlier, under "# s[dot below]h"
  232. Sh=U+0634
  233. shsh=U+0634
  234. sh=U+0634
  235. SU+0323=U+0635
  236. sU+0323sU+0323=U+0635
  237. sU+0323=U+0635
  238. SU+0332=U+062B
  239. sU+0332sU+0332=U+062B
  240. sU+0332=U+062B
  241. SU+0307=U+0685
  242. sU+0307sU+0307=U+0685
  243. sU+0307=U+0685
  244. S=U+0633
  245. ss=U+0633
  246. s=U+0633
  247. J=U+062C
  248. jj=U+062C
  249. j=U+062C
  250. Ch=U+0686
  251. chch=U+0686
  252. ch=U+0686
  253. HU+0323=U+062D
  254. hU+0323hU+0323=U+062D
  255. hU+0323=U+062D
  256. H=U+0647
  257. hh=U+0647
  258. h=U+0647
  259. Kh=U+062E
  260. khkh=U+062E
  261. kh=U+062E
  262. K=U+06A9
  263. kk=U+06A9
  264. k=U+06A9
  265. # particle da
  266. DaU+0020=U+062FU+0020
  267. daU+0020=U+062FU+0020
  268. DU+0323=U+0689
  269. dU+0323dU+0323=U+0689
  270. dU+0323=U+0689
  271. D=U+062F
  272. dd=U+062F
  273. d=U+062F
  274. ZU+0323h=U+0696
  275. zU+0323hzU+0323h=U+0696
  276. zU+0323h=U+0696
  277. Zh=U+0698
  278. zhzh=U+0698
  279. zh=U+0698
  280. ZU+0324=U+0638
  281. zU+0324zU+0324=U+0638
  282. zU+0324=U+0638
  283. ZU+0323=U+0636
  284. zU+0323zU+0323=U+0636
  285. zU+0323=U+0636
  286. ZU+0332=U+0630
  287. zU+0332zU+0332=U+0630
  288. zU+0332=U+0630
  289. ZU+0307=U+0681
  290. zU+0307zU+0307=U+0681
  291. zU+0307=U+0681
  292. Z=U+0632
  293. zz=U+0632
  294. z=U+0632
  295. RU+0323=U+0693
  296. rU+0323rU+0323=U+0693
  297. rU+0323=U+0693
  298. R=U+0631
  299. rr=U+0631
  300. r=U+0631
  301. Gh=U+063A
  302. ghgh=U+063A
  303. gh=U+063A
  304. G=U+06AB
  305. gg=U+06AB
  306. g=U+06AB
  307. F=U+0641
  308. ff=U+0641
  309. f=U+0641
  310. Q=U+0642
  311. qq=U+0642
  312. q=U+0642
  313. L=U+0644
  314. ll=U+0644
  315. l=U+0644
  316. M=U+0645
  317. mm=U+0645
  318. m=U+0645
  319. NU+0323=U+06BC
  320. nU+0323nU+0323=U+06BC
  321. nU+0323=U+06BC
  322. N=U+0646
  323. nn=U+0646
  324. n=U+0646
  325. W=U+0648
  326. ww=U+0648
  327. w=U+0648
  328. Y=U+064A
  329. y=U+064A
  330. # non-Arabic consonants:
  331. # ain (alone)
  332. U+02BB=U+0639
  333. # hamza (alone in final position)
  334. %U+02BE=U+0621
  335. %U+02BC=U+0621
  336. [ScriptToRoman]