Explorar o código

Add ignore list to Armenian.

Stefano Cossu %!s(int64=2) %!d(string=hai) anos
pai
achega
7c89cac36f
Modificáronse 1 ficheiros con 114 adicións e 0 borrados
  1. 114 0
      transliterator/tables/data/armenian.yml

+ 114 - 0
transliterator/tables/data/armenian.yml

@@ -2,6 +2,120 @@ general:
   name: Armenian
 
 roman_to_script:
+  ignore:
+    - "at head of title"
+    - "colophon"
+    - "date of publication not identified"
+    - "place of publication not identified"
+    - "publisher not identified"
+    # NOTE There is ambiguity about ignoring these
+    # words. Note that the single-character Roman
+    # numerals are not included on purpose.
+    # Ideally the source editors should use the
+    # dedicated U+2160÷U+216F (uppercase Roman
+    # numerals) and/or U+2170÷U+217F (lower case Roman
+    # numerals) ranges to avoid this ambiguity.
+    # TODO implement regular expressions for ignore patterns.
+    #- re: "I{2,3}"
+    #- re: "I(V|X)"
+    #- re: "LI{,3}"
+    #- re: "LI?(V|X)"
+    #- re: "L(V|X{1,3})I{,3}"
+    #- re: "LX{1,3}I?V"
+    #- re: "LX{1,3}VI{,3}"
+    #- re: "(V|X{1,3})I{,3}"
+    #- re: "X{1,3}I{,3}"
+    #- re: "X{1,3}I(V|X)"
+    #- re: "X{1,3}VI{,3}"
+    - "II"
+    - "III"
+    - "IV"
+    - "IX"
+    - "LI"
+    - "LII"
+    - "LIII"
+    - "LIV"
+    - "LIX"
+    - "LV"
+    - "LVI"
+    - "LVII"
+    - "LVIII"
+    - "LX"
+    - "LXI"
+    - "LXII"
+    - "LXIII"
+    - "LXIV"
+    - "LXIX"
+    - "LXV"
+    - "LXVI"
+    - "LXVII"
+    - "LXVIII"
+    - "LXX"
+    - "LXXI"
+    - "LXXII"
+    - "LXXIII"
+    - "LXXIV"
+    - "LXXIX"
+    - "LXXV"
+    - "LXXVI"
+    - "LXXVII"
+    - "LXXVIII"
+    - "LXXX"
+    - "LXXXI"
+    - "LXXXII"
+    - "LXXXIII"
+    - "LXXXIV"
+    - "LXXXIX"
+    - "LXXXV"
+    - "LXXXVI"
+    - "LXXXVII"
+    - "LXXXVIII"
+    - "VI"
+    - "VII"
+    - "VIII"
+    - "XI"
+    - "XII"
+    - "XIII"
+    - "XIV"
+    - "XIX"
+    - "XL"
+    - "XLI"
+    - "XLII"
+    - "XLIII"
+    - "XLIV"
+    - "XLIX"
+    - "XLV"
+    - "XLVI"
+    - "XLVII"
+    - "XLVIII"
+    - "XV"
+    - "XVI"
+    - "XVII"
+    - "XVIII"
+    - "XX"
+    - "XXI"
+    - "XXII"
+    - "XXIII"
+    - "XXIV"
+    - "XXIX"
+    - "XXV"
+    - "XXVI"
+    - "XXVII"
+    - "XXVIII"
+    - "XXX"
+    - "XXXI"
+    - "XXXII"
+    - "XXXIII"
+    - "XXXIV"
+    - "XXXIX"
+    - "XXXV"
+    - "XXXVI"
+    - "XXXVII"
+    - "XXXVIII"
+    - "and one other"
+    #- re: "and ([a-z0-9]+ )?others"
+    - "et al."
+
   map:
     "A": "\u0531"
     "a": "\u0561"