|
@@ -2,6 +2,120 @@ general:
|
|
|
name: Armenian
|
|
|
|
|
|
roman_to_script:
|
|
|
+ ignore:
|
|
|
+ - "at head of title"
|
|
|
+ - "colophon"
|
|
|
+ - "date of publication not identified"
|
|
|
+ - "place of publication not identified"
|
|
|
+ - "publisher not identified"
|
|
|
+ # NOTE There is ambiguity about ignoring these
|
|
|
+ # words. Note that the single-character Roman
|
|
|
+ # numerals are not included on purpose.
|
|
|
+ # Ideally the source editors should use the
|
|
|
+ # dedicated U+2160÷U+216F (uppercase Roman
|
|
|
+ # numerals) and/or U+2170÷U+217F (lower case Roman
|
|
|
+ # numerals) ranges to avoid this ambiguity.
|
|
|
+ # TODO implement regular expressions for ignore patterns.
|
|
|
+ #- re: "I{2,3}"
|
|
|
+ #- re: "I(V|X)"
|
|
|
+ #- re: "LI{,3}"
|
|
|
+ #- re: "LI?(V|X)"
|
|
|
+ #- re: "L(V|X{1,3})I{,3}"
|
|
|
+ #- re: "LX{1,3}I?V"
|
|
|
+ #- re: "LX{1,3}VI{,3}"
|
|
|
+ #- re: "(V|X{1,3})I{,3}"
|
|
|
+ #- re: "X{1,3}I{,3}"
|
|
|
+ #- re: "X{1,3}I(V|X)"
|
|
|
+ #- re: "X{1,3}VI{,3}"
|
|
|
+ - "II"
|
|
|
+ - "III"
|
|
|
+ - "IV"
|
|
|
+ - "IX"
|
|
|
+ - "LI"
|
|
|
+ - "LII"
|
|
|
+ - "LIII"
|
|
|
+ - "LIV"
|
|
|
+ - "LIX"
|
|
|
+ - "LV"
|
|
|
+ - "LVI"
|
|
|
+ - "LVII"
|
|
|
+ - "LVIII"
|
|
|
+ - "LX"
|
|
|
+ - "LXI"
|
|
|
+ - "LXII"
|
|
|
+ - "LXIII"
|
|
|
+ - "LXIV"
|
|
|
+ - "LXIX"
|
|
|
+ - "LXV"
|
|
|
+ - "LXVI"
|
|
|
+ - "LXVII"
|
|
|
+ - "LXVIII"
|
|
|
+ - "LXX"
|
|
|
+ - "LXXI"
|
|
|
+ - "LXXII"
|
|
|
+ - "LXXIII"
|
|
|
+ - "LXXIV"
|
|
|
+ - "LXXIX"
|
|
|
+ - "LXXV"
|
|
|
+ - "LXXVI"
|
|
|
+ - "LXXVII"
|
|
|
+ - "LXXVIII"
|
|
|
+ - "LXXX"
|
|
|
+ - "LXXXI"
|
|
|
+ - "LXXXII"
|
|
|
+ - "LXXXIII"
|
|
|
+ - "LXXXIV"
|
|
|
+ - "LXXXIX"
|
|
|
+ - "LXXXV"
|
|
|
+ - "LXXXVI"
|
|
|
+ - "LXXXVII"
|
|
|
+ - "LXXXVIII"
|
|
|
+ - "VI"
|
|
|
+ - "VII"
|
|
|
+ - "VIII"
|
|
|
+ - "XI"
|
|
|
+ - "XII"
|
|
|
+ - "XIII"
|
|
|
+ - "XIV"
|
|
|
+ - "XIX"
|
|
|
+ - "XL"
|
|
|
+ - "XLI"
|
|
|
+ - "XLII"
|
|
|
+ - "XLIII"
|
|
|
+ - "XLIV"
|
|
|
+ - "XLIX"
|
|
|
+ - "XLV"
|
|
|
+ - "XLVI"
|
|
|
+ - "XLVII"
|
|
|
+ - "XLVIII"
|
|
|
+ - "XV"
|
|
|
+ - "XVI"
|
|
|
+ - "XVII"
|
|
|
+ - "XVIII"
|
|
|
+ - "XX"
|
|
|
+ - "XXI"
|
|
|
+ - "XXII"
|
|
|
+ - "XXIII"
|
|
|
+ - "XXIV"
|
|
|
+ - "XXIX"
|
|
|
+ - "XXV"
|
|
|
+ - "XXVI"
|
|
|
+ - "XXVII"
|
|
|
+ - "XXVIII"
|
|
|
+ - "XXX"
|
|
|
+ - "XXXI"
|
|
|
+ - "XXXII"
|
|
|
+ - "XXXIII"
|
|
|
+ - "XXXIV"
|
|
|
+ - "XXXIX"
|
|
|
+ - "XXXV"
|
|
|
+ - "XXXVI"
|
|
|
+ - "XXXVII"
|
|
|
+ - "XXXVIII"
|
|
|
+ - "and one other"
|
|
|
+ #- re: "and ([a-z0-9]+ )?others"
|
|
|
+ - "et al."
|
|
|
+
|
|
|
map:
|
|
|
"A": "\u0531"
|
|
|
"a": "\u0561"
|