# Common ignore list (see `general.name`).
general:
  name: Common ignore list.

# Literal strings listed under `ignore`. Presumably these are left untouched
# during Roman-to-script conversion -- confirm against the consumer.
# Only exact strings are supported for now; see the TODO below.
roman_to_script:
  ignore:
    - "at head of title"
    - "colophon"
    - "date of publication not identified"
    - "place of publication not identified"
    - "publisher not identified"
    # NOTE: Ignoring the Roman numerals below is ambiguous, because they are
    # written with plain Latin letters. The single-character numerals
    # (I, V, X, L) are left out on purpose. The list therefore covers
    # II through LXXXIX (2-89), minus those single-character values.
    # Ideally the source editors should use the dedicated U+2160–U+216F
    # (uppercase Roman numerals) and/or U+2170–U+217F (lowercase Roman
    # numerals) ranges to avoid this ambiguity.
    # TODO: Implement regular expressions for ignore patterns.
    # - re: "I{2,3}"
    # - re: "I(V|X)"
    # - re: "LI{,3}"
    # - re: "LI?(V|X)"
    # - re: "L(V|X{1,3})I{,3}"
    # - re: "LX{1,3}I?V"
    # - re: "LX{1,3}VI{,3}"
    # - re: "(V|X{1,3})I{,3}"
    # - re: "X{1,3}I{,3}"
    # - re: "X{1,3}I(V|X)"
    # - re: "X{1,3}VI{,3}"
    - "II"
    - "III"
    - "IV"
    - "IX"
    - "LI"
    - "LII"
    - "LIII"
    - "LIV"
    - "LIX"
    - "LV"
    - "LVI"
    - "LVII"
    - "LVIII"
    - "LX"
    - "LXI"
    - "LXII"
    - "LXIII"
    - "LXIV"
    - "LXIX"
    - "LXV"
    - "LXVI"
    - "LXVII"
    - "LXVIII"
    - "LXX"
    - "LXXI"
    - "LXXII"
    - "LXXIII"
    - "LXXIV"
    - "LXXIX"
    - "LXXV"
    - "LXXVI"
    - "LXXVII"
    - "LXXVIII"
    - "LXXX"
    - "LXXXI"
    - "LXXXII"
    - "LXXXIII"
    - "LXXXIV"
    - "LXXXIX"
    - "LXXXV"
    - "LXXXVI"
    - "LXXXVII"
    - "LXXXVIII"
    - "VI"
    - "VII"
    - "VIII"
    - "XI"
    - "XII"
    - "XIII"
    - "XIV"
    - "XIX"
    - "XL"
    - "XLI"
    - "XLII"
    - "XLIII"
    - "XLIV"
    - "XLIX"
    - "XLV"
    - "XLVI"
    - "XLVII"
    - "XLVIII"
    - "XV"
    - "XVI"
    - "XVII"
    - "XVIII"
    - "XX"
    - "XXI"
    - "XXII"
    - "XXIII"
    - "XXIV"
    - "XXIX"
    - "XXV"
    - "XXVI"
    - "XXVII"
    - "XXVIII"
    - "XXX"
    - "XXXI"
    - "XXXII"
    - "XXXIII"
    - "XXXIV"
    - "XXXIX"
    - "XXXV"
    - "XXXVI"
    - "XXXVII"
    - "XXXVIII"
    - "and one other"
    # - re: "and ([a-z0-9]+ )?others"
    - "et al."