123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480 |
- # version 1.1
- # Original table by William Kopycki
- # revised by Phong Tran
- # Last updated 19 August 2013
- [General]
- Name=Urdu
- Truncation=%
- [RomanToScript]
- FieldsIncluded=100 110 111 130 240 245 246 250 260 264 440 490 505 600 610 611 630 651 700 710 711 730 740 800 830
- SubfieldsAlwaysExcluded=uvxy0123456789
- # NOTE(review): 650/a is listed below, but tag 650 does not appear in FieldsIncluded above; confirm whether 650 should be added there or this entry is a leftover.
- OtherSubfieldsExcludedByTag=100/e 110/e 111/j 246/i 260/c 264/c 650/a 700/e 700/i 710/e 710/i 711/i 711/j 730/i
- Subfield6Code=(3
- IncludeFormattingCharactersLcPattern=True
- # RDA boilerplate phrases not transliterated:
- Place of publication not identified=Place of publication not identified
- publisher not identified=publisher not identified
- # Punctuation marks:
- # %=U+066A ; cannot transliterate the truncation character
- *=U+066D
- ,=U+060C
- ;=U+061B
- ?=U+061F
- # Exceptions for specific words
- # Allah
- AllaU+0304h=U+0627U+0644U+0644U+0647
- allaU+0304h=U+0627U+0644U+0644U+0647
- # Qur'an
- QurU+02BCaU+0304n=U+0642U+0631U+0622U+0646
- qurU+02BCaU+0304n=U+0642U+0631U+0622U+0646
- # aur (with spaces)
- # NOTE(review): the two entries below differ in whitespace around "=" (the first has a space after it, the second does not); confirm this is intended and how the loader treats it.
- aur = U+0627U+0648U+0631
- Aur =U+0627U+0648U+0631
- ####
- # Abdurrahman
- U+02BBAbdurrahU+0323maU+0301n=U+0639U+0628U+062FU+0627U+0644U+0631U+062DU+0645U+0670U+0646
- U+02BBAbdurrahU+0323maU+0304n=U+0639U+0628U+062FU+0627U+0644U+0631U+062DU+0645U+0670U+0646
- # Abd names
- # Each rule outputs U+0639U+0628U+062FU+0627U+0644 followed by the first
- # letter of the next name element. Escapes are always written as an
- # uppercase "U+" plus four hex digits, matching the rest of the table.
- U+02BBAbdulU+02BB=U+0639U+0628U+062FU+0627U+0644U+0639
- U+02BBAbdula=U+0639U+0628U+062FU+0627U+0644
- U+02BBAbdulb=U+0639U+0628U+062FU+0627U+0644U+0628
- U+02BBAbdulf=U+0639U+0628U+062FU+0627U+0644U+0641
- U+02BBAbdulgU+0332hU+0332=U+0639U+0628U+062FU+0627U+0644U+063A
- U+02BBAbdulhU+0323=U+0639U+0628U+062FU+0627U+0644U+062D
- U+02BBAbdulh=U+0639U+0628U+062FU+0627U+0644U+0647
- U+02BBAbdulj=U+0639U+0628U+062FU+0627U+0644U+062C
- U+02BBAbdulkU+0332hU+0332=U+0639U+0628U+062FU+0627U+0644U+062E
- U+02BBAbdulk=U+0639U+0628U+062FU+0627U+0644U+0643
- U+02BBAbdulm=U+0639U+0628U+062FU+0627U+0644U+0645
- U+02BBAbdulq=U+0639U+0628U+062FU+0627U+0644U+0642
- U+02BBAbdulv=U+0639U+0628U+062FU+0627U+0644U+0648
- U+02BBAbdunn=U+0639U+0628U+062FU+0627U+0644U+0646
- U+02BBAbdurr=U+0639U+0628U+062FU+0627U+0644U+0631
- # s with dot below doubles to sad (U+0635)
- U+02BBAbdusU+0323sU+0323=U+0639U+0628U+062FU+0627U+0644U+0635
- U+02BBAbduss=U+0639U+0628U+062FU+0627U+0644U+0633
- U+02BBAbdushsh=U+0639U+0628U+062FU+0627U+0644U+0634
- U+02BBAbdutt=U+0639U+0628U+062FU+0627U+0644U+062A
- U+02BBAbduzU+0323zU+0323=U+0639U+0628U+062FU+0627U+0644U+0636
- U+02BBAbduzU+0324zU+0324=U+0639U+0628U+062FU+0627U+0644U+0638
- # Abu names
- AbuU+0304 =U+0627U+0628U+0648U+0020
- AbuU+0304=U+0627U+0628U+0648U+200CU+0627U+0644
- ####
- #lillah
- lillaU+0304h=U+0644U+0644U+0647
- #billah
- billaU+0304h=U+0628U+0644U+0644U+0647
- # Rahman
- RahU+0323maU+0304n=U+0631U+062DU+0645U+0646
- # Nuzhat
- Nuzhat=U+0646U+0632U+0647U+062A
- # Uddin names
- %iU+0304uddiU+0304n=U+0649U+200CU+0627U+0644U+062FU+0651U+064AU+0646
- %uddiU+0304n=U+200CU+0627U+0644U+062FU+0651U+064AU+0646
- # ta'lif
- # Ibn when it appears in the middle of a name sequence
- ibn=U+0628U+0646
- # Abbreviated name elements
- # Ae=U+0627U+06D2
- # Parsing "s" followed by "h[dot below]" (seen + hah, not sheen), as in "Ishaq [name]"
- %shU+0323%=U+0633U+062D
- # Numbers (U+06F0-06F9 for Persian/Urdu)
- # currently *not* valid MARC21 characters
- # 0=U+06F0
- # 1=U+06F1
- # 2=U+06F2
- # 3=U+06F3
- # 4=U+06F4
- # 5=U+06F5
- # 6=U+06F6
- # 7=U+06F7
- # 8=U+06F8
- # 9=U+06F9
- # Postpositions
- # Aspirates [06BE] vs. consonant + hah [062D] combinations
- bhU+0323=U+0628U+062D
- Bh=U+0628U+06BE
- bh=U+0628U+06BE
- phU+0323=U+067EU+062D
- Ph=U+067EU+06BE
- ph=U+067EU+06BE
- thU+0323=U+062AU+062D
- Th=U+062AU+06BE
- th=U+062AU+06BE
- tU+0323hU+0323=U+0679U+062D
- TU+0323h=U+0679U+06BE
- tU+0323h=U+0679U+06BE
- jhU+0323=U+062CU+062D
- Jh=U+062CU+06BE
- jh=U+062CU+06BE
- chU+0323=U+0686U+062D
- Ch=U+0686U+06BE
- ch=U+0686U+06BE
- dhU+0323=U+062FU+062D
- Dh=U+062FU+06BE
- dh=U+062FU+06BE
- dU+0323hU+0323=U+0688U+062D
- DU+0323h=U+0688U+06BE
- dU+0323h=U+0688U+06BE
- rU+0323hU+0323=U+0691U+062D
- RU+0323h=U+0691U+06BE
- rU+0323h=U+0691U+06BE
- khU+0323=U+06A9U+062D
- Kh=U+06A9U+06BE
- kh=U+06A9U+06BE
- ghU+0323=U+06AFU+062D
- Gh=U+06AFU+06BE
- gh=U+06AFU+06BE
- # prime = ZWNJ
- U+02B9AU+0304=U+200CU+0622
- U+02B9aU+0304=U+200CU+0622
- aU+0304U+02BCU+02B9=U+0627U+0621U+200C
- iU+0304U+02B9=U+0649U+200C
- U+02B9=U+200C
- # Izafah here
- %aU+0304-yi=U+0627U+0626U+06D2
- %uU+0304-yi=U+0648U+0626U+06D2
- %o-yi=U+0648U+0626U+06D2
- %e-yi=U+06D2
- %iU+0304-yi=U+0649
- %h-yi=U+06C0
- %-yi=U+06C0
- %al-i=U+0644
- %ul-i=U+0644
- %-i=
- # Hyphenated prefixes:
- bi-=U+0628
- al-aU+0304%=U+0627U+0644U+0627
- ul-aU+0304%=U+0627U+0644U+0627
- al-=U+0627U+0644
- ul-=U+0627U+0644
- lil-i=U+0644U+0644
- lil-=U+0644U+0644
- # al-/ul- plus sun letters
- ar-r=U+0627U+0644U+0631
- ur-r=U+0627U+0644U+0631
- ar-R=U+0627U+0644U+0631
- ur-R=U+0627U+0644U+0631
- azU+0332-zU+0332=U+0627U+0644U+0630
- uzU+0332-zU+0332=U+0627U+0644U+0630
- azU+0332-ZU+0332=U+0627U+0644U+0630
- uzU+0332-ZU+0332=U+0627U+0644U+0630
- # al-/ul- assimilated to dal: alif + lam + dal (U+062F)
- ad-d=U+0627U+0644U+062F
- ud-d=U+0627U+0644U+062F
- ad-D=U+0627U+0644U+062F
- ud-D=U+0627U+0644U+062F
- asU+0332-sU+0332=U+0627U+0644U+062B
- usU+0332-sU+0332=U+0627U+0644U+062B
- asU+0332-SU+0332=U+0627U+0644U+062B
- usU+0332-SU+0332=U+0627U+0644U+062B
- at-t=U+0627U+0644U+062A
- ut-t=U+0627U+0644U+062A
- at-T=U+0627U+0644U+062A
- ut-T=U+0627U+0644U+062A
- an-n=U+0627U+0644U+0646
- un-n=U+0627U+0644U+0646
- an-N=U+0627U+0644U+0646
- un-N=U+0627U+0644U+0646
- al-l=U+0627U+0644U+0644
- ul-l=U+0627U+0644U+0644
- al-L=U+0627U+0644U+0644
- ul-L=U+0627U+0644U+0644
- azU+0324-zU+0324=U+0627U+0644U+0638
- uzU+0324-zU+0324=U+0627U+0644U+0638
- azU+0324-ZU+0324=U+0627U+0644U+0638
- uzU+0324-ZU+0324=U+0627U+0644U+0638
- atU+0324-tU+0324=U+0627U+0644U+0637
- utU+0324-tU+0324=U+0627U+0644U+0637
- atU+0324-TU+0324=U+0627U+0644U+0637
- utU+0324-TU+0324=U+0627U+0644U+0637
- azU+0323-zU+0323=U+0627U+0644U+0636
- uzU+0323-zU+0323=U+0627U+0644U+0636
- azU+0323-ZU+0323=U+0627U+0644U+0636
- uzU+0323-ZU+0323=U+0627U+0644U+0636
- asU+0323-sU+0323=U+0627U+0644U+0635
- usU+0323-sU+0323=U+0627U+0644U+0635
- asU+0323-SU+0323=U+0627U+0644U+0635
- usU+0323-SU+0323=U+0627U+0644U+0635
- ash-sh=U+0627U+0644U+0634
- ush-sh=U+0627U+0644U+0634
- ash-Sh=U+0627U+0644U+0634
- ush-Sh=U+0627U+0644U+0634
- as-s=U+0627U+0644U+0633
- us-s=U+0627U+0644U+0633
- as-S=U+0627U+0644U+0633
- us-S=U+0627U+0644U+0633
- az-z=U+0627U+0644U+0632
- uz-z=U+0627U+0644U+0632
- az-Z=U+0627U+0644U+0632
- uz-Z=U+0627U+0644U+0632
- # Diphthongs here
- Ae=U+0627U+06D2
- %ai=U+06D2
- Ai=U+0627U+064A
- ai%=U+0627U+064A
- ai=U+064A
- U+02BBAu=U+0639U+0648
- U+02BBau=U+0639U+0648
- Au=U+0627U+0648
- au=U+0648
- # ayn-alif combo
- %U+02BBaU+0304U+02BE=U+0639U+0627U+0621
- %U+02BBaU+0304U+02BC=U+0639U+0627U+0621
- %U+02BBaU+0304%=U+0639U+0627
- # hamza and vowel combo
- # [in final position]
- # The long-i key is written i + U+0304 (combining macron), four hex digits
- # as in every other rule.
- %uU+0304U+02BEiU+0304=U+0648U+0626U+0649
- %uU+0304U+02BCiU+0304=U+0648U+0626U+0649
- %U+02BEiU+0304=U+0626U+0649
- %U+02BCiU+0304=U+0626U+0649
- %U+02BEe=U+0626U+06D2
- %U+02BCe=U+0626U+06D2
- %U+02BEuU+0304=U+0624
- %U+02BCuU+0304=U+0624
- %U+02BEo=U+0624
- %U+02BCo=U+0624
- # [in medial position]
- aU+02BEa=U+0623
- aU+02BCa=U+0623
- aU+0304U+02BEa=U+0627U+0621
- aU+0304U+02BCa=U+0627U+0621
- aU+02BEaU+0304=U+0622
- aU+02BCaU+0304=U+0622
- oU+02BEiU+0304=U+0648U+0626U+064A
- oU+02BCiU+0304=U+0648U+0626U+064A
- oU+02BEi=U+0648U+0626
- oU+02BCi=U+0648U+0626
- U+02BEiU+0304=U+0626U+064A
- U+02BCiU+0304=U+0626U+064A
- U+02BEi=U+0626
- U+02BCi=U+0626
- U+02BEe=U+0626U+064A
- U+02BCe=U+0626U+064A
- U+02BEuU+0304=U+0624
- U+02BCuU+0304=U+0624
- uU+0304U+02BE=U+0624
- uU+0304U+02BC=U+0624
- U+02BEo=U+0624
- U+02BCo=U+0624
- oU+02BE=U+0624
- oU+02BC=U+0624
- auU+02BE=U+0624
- auU+02BC=U+0624
- U+02BEa=U+0626
- U+02BCa=U+0626
- %iU+0304=U+0649
- %aU+0301=U+0649U+0670
- # A
- U+02BBAU+0304=U+0639U+0627
- U+02BBaU+0304=U+0639U+0627
- U+02BBA%=U+0639
- U+02BBa=U+0639
- AU+02BB=U+0627U+0639
- aU+02BB%=U+0627U+0639
- aU+02BB=U+0639
- AU+0304%=U+0622
- aU+0304%=U+0622
- aU+0304=U+0627
- aU+0301=U+0649
- ayy=U+064AU+0651
- A%=U+0627
- a%=U+0627
- A=
- a=
- # E
- %e=U+06D2
- E%=U+0627U+064A
- e%=U+0627U+064A
- e=U+064A
- # I
- U+02BBIU+0304=U+0639U+064A
- U+02BBiU+0304=U+0639U+064A
- IU+02BB=U+0627U+0639
- iU+02BB=U+0639
- U+02BBI=U+0639
- IU+0304%=U+0627U+064A
- iU+0304%=U+0627U+064A
- iU+0304y=U+064A
- iU+0304=U+064A
- iyy=U+064AU+0651
- I%=U+0627
- i%=U+0627
- I=U+0627
- i=
- # O
- O%=U+0627U+0648
- o=U+0648
- # U
- U+02BBuU+0304=U+0639U+0648
- U+02BBU=U+0639
- U+02BBu=U+0639
- UU+0304%=U+0627U+0648
- uU+0304%=U+0627U+0648
- uU+0304=U+0648
- U%=U+0627
- u%=U+0627
- U=
- u=
- # Consonants:
- B=U+0628
- bb=U+0628U+0651
- b=U+0628
- P=U+067E
- pp=U+067EU+0651
- p=U+067E
- TU+0323=U+0679
- tU+0323tU+0323=U+0679U+0651
- tU+0323=U+0679
- TU+0324=U+0637
- tU+0324tU+0324=U+0637U+0651
- tU+0324=U+0637
- T=U+062A
- tt=U+062AU+0651
- t=U+062A
- Sh=U+0634
- shsh=U+0634U+0651
- sh=U+0634
- SU+0323=U+0635
- sU+0323sU+0323=U+0635U+0651
- sU+0323=U+0635
- SU+0332=U+062B
- sU+0332sU+0332=U+062BU+0651
- sU+0332=U+062B
- S=U+0633
- ss=U+0633U+0651
- s=U+0633
- J=U+062C
- jj=U+062CU+0651
- j=U+062C
- C=U+0686
- cc=U+0686U+0651
- c=U+0686
- HU+0323=U+062D
- hU+0323hU+0323=U+062DU+0651
- hU+0323=U+062D
- H=U+0647
- hh=U+0647U+0651
- h=U+0647
- KU+0332hU+0332=U+062E
- kU+0332hU+0332kU+0332hU+0332=U+062EU+0651
- kU+0332hU+0332=U+062E
- K=U+06A9
- kk=U+06A9U+0651
- k=U+06A9
- DU+0323=U+0688
- dU+0323dU+0323=U+0688U+0651
- dU+0323=U+0688
- D=U+062F
- dd=U+062FU+0651
- d=U+062F
- ZU+0324=U+0638
- zU+0324zU+0324=U+0638U+0651
- zU+0324=U+0638
- ZU+0323=U+0636
- zU+0323zU+0323=U+0636U+0651
- zU+0323=U+0636
- ZU+0332=U+0630
- zU+0332zU+0332=U+0630U+0651
- zU+0332=U+0630
- zz=U+0632U+0651
- Zh=U+0698
- zhzh=U+0698U+0651
- zh=U+0698
- Z=U+0632
- z=U+0632
- RU+0323=U+0691
- rU+0323rU+0323=U+0691U+0651
- rU+0323=U+0691
- R=U+0631
- rr=U+0631U+0651
- r=U+0631
- GU+0332hU+0332=U+063A
- gU+0332hU+0332gU+0332hU+0332=U+063AU+0651
- gU+0332hU+0332=U+063A
- G=U+06AF
- gg=U+06AFU+0651
- g=U+06AF
- F=U+0641
- ff=U+0641U+0651
- f=U+0641
- Q=U+0642
- qq=U+0642U+0651
- q=U+0642
- L=U+0644
- ll=U+0644U+0651
- l=U+0644
- M=U+0645
- mm=U+0645U+0651
- m=U+0645
- NU+0332=U+06BA
- nU+0332nU+0332=U+06BAU+0651
- nU+0332=U+06BA
- N=U+0646
- nn=U+0646U+0651
- n=U+0646
- V=U+0648
- vv=U+0648U+0651
- v=U+0648
- Y=U+064A
- yy=U+064AU+0651
- y=U+064A
- # ain (alone)
- U+02BB=U+0639
- # hamza (alone in final position)
- %U+02BE=U+0621
- %U+02BC=U+0621
- [ScriptToRoman]
|