|
@@ -311,9 +311,15 @@ roman_to_script:
|
|
"%\u02BC": "\u0621"
|
|
"%\u02BC": "\u0621"
|
|
|
|
|
|
script_to_roman:
|
|
script_to_roman:
|
|
|
|
+ hooks:
|
|
|
|
+ post_normalize:
|
|
|
|
+ -
|
|
|
|
+ - arabic.normalize.camel_normalize
|
|
|
|
+ -
|
|
|
|
+ - arabic.normalize.tashkeel_vocalize
|
|
|
|
+
|
|
map:
|
|
map:
|
|
- # Copy & paste from
|
|
|
|
- # https://www.loc.gov/catdir/cpso/romanization/persian.pdf
|
|
|
|
|
|
+ # From https://www.loc.gov/catdir/cpso/romanization/persian.pdf
|
|
"\u0627": "" # ا
|
|
"\u0627": "" # ا
|
|
"\u0628": "b" # ب
|
|
"\u0628": "b" # ب
|
|
"\u067E": "p" # پ
|
|
"\u067E": "p" # پ
|
|
@@ -331,7 +337,7 @@ script_to_roman:
|
|
"\u0633": "s" # س
|
|
"\u0633": "s" # س
|
|
"\u0634": "sh" # ش
|
|
"\u0634": "sh" # ش
|
|
"\u0635": "\u1E63" # ص
|
|
"\u0635": "\u1E63" # ص
|
|
- "\u0636": "z̤" # ض
|
|
|
|
|
|
+ "\u0636": "z\u0324" # ض
|
|
"\u0637": "\u1E6D" # ط
|
|
"\u0637": "\u1E6D" # ط
|
|
"\u0638": "\u1E93" # ظ
|
|
"\u0638": "\u1E93" # ظ
|
|
"\u0639": "\u2018" # ع
|
|
"\u0639": "\u2018" # ع
|
|
@@ -346,7 +352,7 @@ script_to_roman:
|
|
"\u0648": "v" # و
|
|
"\u0648": "v" # و
|
|
"\u0647": "h" # ه
|
|
"\u0647": "h" # ه
|
|
"\u0629": "h" # ة
|
|
"\u0629": "h" # ة
|
|
- "\u064A": "y" # ي
|
|
|
|
|
|
+ "\u064A": "y" # ي  NOTE(review): U+064A is ARABIC LETTER YEH, not ARABIC LETTER FARSI YEH (U+06CC); confirm this mapping is intended.
|
|
|
|
|
|
# Vowels and diphthongs
|
|
# Vowels and diphthongs
|
|
"\u064E": "a" # ◌َ
|
|
"\u064E": "a" # ◌َ
|
|
@@ -358,3 +364,6 @@ script_to_roman:
|
|
"\u064E\u0652\u0648": "aw" # ◌َوْ
|
|
"\u064E\u0652\u0648": "aw" # ◌َوْ
|
|
"\u064F\u0648": "\u016B" # ◌ُو
|
|
"\u064F\u0648": "\u016B" # ◌ُو
|
|
"\u064E\u0649\u0648": "ay" # ◌َىْ
|
|
"\u064E\u0649\u0648": "ay" # ◌َىْ
|
|
|
|
+
|
|
|
|
+ # Not in ALA-LC spec sheet
|
|
|
|
+ "\u06CC": "y" # ی Farsi Yeh
|