pushto.yml 8.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392
  1. ---
  2. general:
  3. name: Pushto
  4. case_sensitive: false
  5. roman_to_script:
  6. map:
  7. # Punctuation marks:
  8. # "%": "\u066A"  # disabled: "%" is the truncation character, so it cannot be transliterated
  9. "*": "\u066D"
  10. ",": "\u060C"
  11. ";": "\u061B"
  12. "?": "\u061F"
  13. # Exceptions for specific words
  14. # Allah
  15. "Alla\u0304h": "\u0627\u0644\u0644\u0647"
  16. # Qur'an
  17. "Qur\u02BCa\u0304n": "\u0642\u0631\u0622\u0646"
  18. # lillah
  19. "lilla\u0304h": "\u0644\u0644\u0647"
  20. # billah
  21. "billa\u0304h": "\u0628\u0644\u0644\u0647"
  22. # Rahman
  23. "Rah\u0323ma\u0304n": "\u0631\u062D\u0645\u0646"
  24. # ta'lif
  25. # Ibn when it appears in the middle of a name sequence
  26. "ibn": "\u0628\u0646"
  27. # Parsing "s" + "h[dot below]" (rather than "sh"), as in "Ishaq" [name]
  28. "%sh\u0323%": "\u0633\u062D"
  29. # Edition statements with Latin number
  30. "Cha\u0304p-i 1": "\u0686\u0627\u067E 1"
  31. "Cha\u0304p-i 2": "\u0686\u0627\u067E 2"
  32. "Cha\u0304p-i 3": "\u0686\u0627\u067E 3"
  33. "Cha\u0304p-i 4": "\u0686\u0627\u067E 4"
  34. "Cha\u0304p-i 5": "\u0686\u0627\u067E 5"
  35. "Cha\u0304p-i 6": "\u0686\u0627\u067E 6"
  36. "Cha\u0304p-i 7": "\u0686\u0627\u067E 7"
  37. "Cha\u0304p-i 8": "\u0686\u0627\u067E 8"
  38. "Cha\u0304p-i 9": "\u0686\u0627\u067E 9"
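  39. # Numbers (Extended Arabic-Indic digits \u06F0-\u06F9, as used for Persian);
  40. # currently *not* valid MARC21 characters, so the keys below carry a literal "# " prefix and do not match bare digits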
  41. "# 0": "\u06F0"
  42. "# 1": "\u06F1"
  43. "# 2": "\u06F2"
  44. "# 3": "\u06F3"
  45. "# 4": "\u06F4"
  46. "# 5": "\u06F5"
  47. "# 6": "\u06F6"
  48. "# 7": "\u06F7"
  49. "# 8": "\u06F8"
  50. "# 9": "\u06F9"
  51. # Use Basic Arabic digits \u0660-\u0669 instead:
  52. "0": "\u0660"
  53. "1": "\u0661"
  54. "2": "\u0662"
  55. "3": "\u0663"
  56. "4": "\u0664"
  57. "5": "\u0665"
  58. "6": "\u0666"
  59. "7": "\u0667"
  60. "8": "\u0668"
  61. "9": "\u0669"
  62. "# prime ": " ZWNJ"
  63. "\u02B9a\u0304": "\u200C\u0622"
  64. "\u02B9a": "\u200C\u0627"
  65. "%\u02B9i\u0304": "\u200C\u0627\u0649"
  66. "\u02B9i\u0304": "\u200C\u0627\u064A"
  67. "i\u0304\u02B9": "\u0649\u200C"
  68. "a\u0323y\u02B9": "\u06D3\u200C"
  69. "\u02B9": "\u200C"
  70. # Vowel and vowel/consonant combinations
  71. # and hyphenated suffixes:
  72. # izafah here
  73. "%h-\u02BEi": "\u06C0"
  74. "%h-\u02BCi": "\u06C0"
  75. "%-\u02BEi": "\u06C0"
  76. "%-\u02BCi": "\u06C0"
  77. "%h-yi": "\u0647\u200C\u0649"
  78. "%-yi": "\u0649"
  79. "%yi": "\u0649"
  80. "%\u02BEi\u0304": "\u0649"
  81. "%\u02BCi\u0304": "\u0649"
  82. "%i\u0304-i": "\u0649"
  83. "%i\u0304": "\u0649"
  84. "%a\u0323h": "\u06C0"
  85. "%ayy-i": "\u0649"
  86. "%a\u0304y": "\u0627\u0649"
  87. "%a\u0301": "\u0649\u0670"
  88. "%al-i": "\u0644"
  89. "%-i": ""
  90. # Hyphenated prefixes:
  91. "wa-": "\u0648"
  92. "bi-": "\u0628"
  93. "al-": "\u0627\u0644"
  94. "lil-": "\u0644\u0644"
  95. "li-": "\u0644"
  96. "ka-": "\u0643"
  97. # Diphthongs here
  98. "Ayy%": "\u0627\u064A"
  99. "ayy%": "\u0627\u064A"
  100. "%a\u0323y": "\u06D3"
  101. "%ay": "\u0649"
  102. "\u02BBAw": "\u0639\u0648"
  103. "\u02BBaw": "\u0639\u0648"
  104. "Aw": "\u0627\u0648"
  105. "aw": "\u0648"
  106. # ayn combo
  107. "%\u02BBa\u0304%": "\u0639\u0627"
  108. # alif combos
  109. # [final position]
  110. "%a\u0304\u02BE": "\u0627\u0621"
  111. "%a\u0304\u02BC": "\u0627\u0621"
  112. "%a\u0304\u02BEi\u0304": "\u0627\u0626\u0649"
  113. "%a\u0304\u02BCi\u0304": "\u0627\u0626\u0649"
  114. # [initial position]
  115. "A\u0304\u02BEi\u0304%": "\u0622\u0626\u064A"
  116. "A\u0304\u02BCi\u0304%": "\u0622\u0626\u064A"
  117. "a\u0304\u02BEi\u0304%": "\u0622\u0626\u064A"
  118. "a\u0304\u02BCi\u0304%": "\u0622\u0626\u064A"
  119. # [medial position]
  120. "a\u0304\u02BEi\u0304": "\u0627\u0626\u064A"
  121. "a\u0304\u02BCi\u0304": "\u0627\u0626\u064A"
  122. "a\u0304\u02BEi": "\u0627\u0626"
  123. "a\u0304\u02BCi": "\u0627\u0626"
  124. "a\u02BEi\u0304": "\u0626\u064A"
  125. "a\u02BCi\u0304": "\u0626\u064A"
  126. # a [macron] + hamza, followed by e
  127. "a\u0304\u02BEe": "\u0627\u0626\u064A"
  128. "a\u0304\u02BCe": "\u0627\u0626\u064A"
  129. # s[dot below]h
  130. "S\u0323h": "\u069A"
  131. "s\u0323hs\u0323h": "\u069A"
  132. "s\u0323h": "\u069A"
  133. # A
  134. "\u02BBA\u0304": "\u0639\u0627"
  135. "\u02BBa\u0304": "\u0639\u0627"
  136. "\u02BBA%": "\u0639"
  137. "\u02BBa": "\u0639"
  138. "A\u02BB": "\u0623\u0639"
  139. "a\u02BB": "\u0639"
  140. "a\u02BE": "\u0623"
  141. "a\u02BC": "\u0623"
  142. "\u02BEa": "\u0623"
  143. "\u02BCa": "\u0623"
  144. "a\u0304\u02BE": "\u0621"
  145. "a\u0304\u02BC": "\u0621"
  146. "A\u0304%": "\u0622"
  147. "a\u0304%": "\u0622"
  148. "A\u0304": "\u0627"
  149. "a\u0304": "\u0627"
  150. "A\u0301": "\u0649"
  151. "a\u0301": "\u0649"
  152. "ayy": "\u064A"
  153. # heh hamzah at end
  154. "a\u0323h": "\u06C0"
  155. "A%": "\u0627"
  156. "a%": "\u0627"
  157. "A": ""
  158. "a": ""
  159. # E
  160. "%e": "\u06D0"
  161. "E%": "\u0627\u064A"
  162. "e%": "\u0627\u064A"
  163. "e": "\u06D0"
  164. # I
  165. "I\u02BB%": "\u0627\u0639"
  166. "i\u02BB%": "\u0627\u0639"
  167. "i\u02BB": "\u0639"
  168. "\u02BBI%": "\u0639"
  169. "I\u02BE%": "\u0627\u0626"
  170. "I\u02BC%": "\u0627\u0626"
  171. "i\u02BE": "\u0626"
  172. "i\u02BC": "\u0626"
  173. "\u02BEi": "\u0626"
  174. "\u02BCi": "\u0626"
  175. "I\u0304%": "\u0627\u064A"
  176. "i\u0304%": "\u0627\u064A"
  177. "i\u0304y": "\u064A"
  178. "i\u0304": "\u064A"
  179. "I%": "\u0627"
  180. "i%": "\u0627"
  181. "I": ""
  182. "i": ""
  183. # O
  184. "o%": "\u0627\u0648"
  185. "O%": "\u0627\u0648"
  186. "o": "\u0648"
  187. # U
  188. # (u [macron] hamza combos)
  189. "u\u0304\u02BE": "\u0624"
  190. "u\u0304\u02BC": "\u0624"
  191. "\u02BEu\u0304": "\u0626\u0648"
  192. "\u02BCu\u0304": "\u0626\u0648"
  193. "U\u02BE%": "\u0627\u0624"
  194. "U\u02BC%": "\u0627\u0624"
  195. "u\u02BE": "\u0624"
  196. "u\u02BC": "\u0624"
  197. "U\u0304w%": "\u0627\u0648"
  198. "u\u0304w": "\u0648"
  199. "U\u0304": "\u0627\u0648"
  200. "u\u0304": "\u0648"
  201. "U%": "\u0627"
  202. "u%": "\u0627"
  203. "U": ""
  204. "u": ""
  205. # Consonants:
  206. "B": "\u0628"
  207. "bb": "\u0628"
  208. "b": "\u0628"
  209. "P": "\u067E"
  210. "pp": "\u067E"
  211. "p": "\u067E"
  212. "T\u0324": "\u0637"
  213. "t\u0324t\u0324": "\u0637"
  214. "t\u0324": "\u0637"
  215. "T\u0323": "\u067C"
  216. "t\u0323t\u0323": "\u067C"
  217. "t\u0323": "\u067C"
  218. "T": "\u062A"
  219. "tt": "\u062A"
  220. "t": "\u062A"
  221. # s[dot below]h entries are no longer here; they are defined earlier in this map, under "# s[dot below]h"
  222. "Sh": "\u0634"
  223. "shsh": "\u0634"
  224. "sh": "\u0634"
  225. "S\u0323": "\u0635"
  226. "s\u0323s\u0323": "\u0635"
  227. "s\u0323": "\u0635"
  228. "S\u0332": "\u062B"
  229. "s\u0332s\u0332": "\u062B"
  230. "s\u0332": "\u062B"
  231. "S\u0307": "\u0685"
  232. "s\u0307s\u0307": "\u0685"
  233. "s\u0307": "\u0685"
  234. "S": "\u0633"
  235. "ss": "\u0633"
  236. "s": "\u0633"
  237. "J": "\u062C"
  238. "jj": "\u062C"
  239. "j": "\u062C"
  240. "Ch": "\u0686"
  241. "chch": "\u0686"
  242. "ch": "\u0686"
  243. "H\u0323": "\u062D"
  244. "h\u0323h\u0323": "\u062D"
  245. "h\u0323": "\u062D"
  246. "H": "\u0647"
  247. "hh": "\u0647"
  248. "h": "\u0647"
  249. "Kh": "\u062E"
  250. "khkh": "\u062E"
  251. "kh": "\u062E"
  252. "K": "\u06A9"
  253. "kk": "\u06A9"
  254. "k": "\u06A9"
  255. # particle da
  256. "Da\u0020": "\u062F\u0020"
  257. "da\u0020": "\u062F\u0020"
  258. "D\u0323": "\u0689"
  259. "d\u0323d\u0323": "\u0689"
  260. "d\u0323": "\u0689"
  261. "D": "\u062F"
  262. "dd": "\u062F"
  263. "d": "\u062F"
  264. "Z\u0323h": "\u0696"
  265. "z\u0323hz\u0323h": "\u0696"
  266. "z\u0323h": "\u0696"
  267. "Zh": "\u0698"
  268. "zhzh": "\u0698"
  269. "zh": "\u0698"
  270. "Z\u0324": "\u0638"
  271. "z\u0324z\u0324": "\u0638"
  272. "z\u0324": "\u0638"
  273. "Z\u0323": "\u0636"
  274. "z\u0323z\u0323": "\u0636"
  275. "z\u0323": "\u0636"
  276. "Z\u0332": "\u0630"
  277. "z\u0332z\u0332": "\u0630"
  278. "z\u0332": "\u0630"
  279. "Z\u0307": "\u0681"
  280. "z\u0307z\u0307": "\u0681"
  281. "z\u0307": "\u0681"
  282. "Z": "\u0632"
  283. "zz": "\u0632"
  284. "z": "\u0632"
  285. "R\u0323": "\u0693"
  286. "r\u0323r\u0323": "\u0693"
  287. "r\u0323": "\u0693"
  288. "R": "\u0631"
  289. "rr": "\u0631"
  290. "r": "\u0631"
  291. "Gh": "\u063A"
  292. "ghgh": "\u063A"
  293. "gh": "\u063A"
  294. "G": "\u06AB"
  295. "gg": "\u06AB"
  296. "g": "\u06AB"
  297. "F": "\u0641"
  298. "ff": "\u0641"
  299. "f": "\u0641"
  300. "Q": "\u0642"
  301. "qq": "\u0642"
  302. "q": "\u0642"
  303. "L": "\u0644"
  304. "ll": "\u0644"
  305. "l": "\u0644"
  306. "M": "\u0645"
  307. "mm": "\u0645"
  308. "m": "\u0645"
  309. "N\u0323": "\u06BC"
  310. "n\u0323n\u0323": "\u06BC"
  311. "n\u0323": "\u06BC"
  312. "N": "\u0646"
  313. "nn": "\u0646"
  314. "n": "\u0646"
  315. "W": "\u0648"
  316. "ww": "\u0648"
  317. "w": "\u0648"
  318. "Y": "\u064A"
  319. "y": "\u064A"
  320. # non-Arabic consonants:
  321. # ain (alone)
  322. "\u02BB": "\u0639"
  323. # hamza (alone in final position)
  324. "%\u02BE": "\u0621"
  325. "%\u02BC": "\u0621"