---
# Common ignore list: words and patterns that are left untouched by
# Roman-to-script processing.
#
# NOTE(review): the nesting below was reconstructed from a flattened copy of
# this file. It assumes `ignore_ptn` and `ignore` are both children of
# `roman_to_script` - confirm against the table loader.
general:
  name: Common ignore list.

roman_to_script:
  # Regular expression patterns to ignore.
  # NOTE(review): `\<` and `\>` are presumably interpreted as word-boundary
  # anchors by the consumer - confirm against the regex engine in use.
  ignore_ptn:
    # Roman numerals II through LXXXIX.
    # NOTE There is ambiguity about ignoring these words. The
    # single-character Roman numerals (I, V, X, L) are not included on
    # purpose, so every pattern below requires at least two characters.
    # Ideally the source editors should use the dedicated U+2160 to U+216F
    # (uppercase Roman numerals) and/or U+2170 to U+217F (lowercase Roman
    # numerals) ranges to avoid this ambiguity.
    # Quantifiers are written `{0,3}` rather than `{,3}` because not every
    # regex engine accepts an omitted lower bound.
    #
    # II, III
    - "\\<I{2,3}\\>"
    # IV, IX
    - "\\<I(V|X)\\>"
    # VI-VIII, XI-XIII (never a bare V or X)
    - "\\<(V|X)I{1,3}\\>"
    # XX-XXIII, XXX-XXXIII
    - "\\<X{2,3}I{0,3}\\>"
    # XIV, XIX, XXIV, XXIX, XXXIV, XXXIX
    - "\\<X{1,3}I(V|X)\\>"
    # XV-XVIII, XXV-XXVIII, XXXV-XXXVIII
    - "\\<X{1,3}VI{0,3}\\>"
    # XL-XLIII
    - "\\<XLI{0,3}\\>"
    # XLIV, XLIX
    - "\\<XLI(V|X)\\>"
    # XLV-XLVIII
    - "\\<XLVI{0,3}\\>"
    # LI-LIII (never a bare L)
    - "\\<LI{1,3}\\>"
    # LIV, LIX, LV, LX
    - "\\<LI?(V|X)\\>"
    # LV-LVIII, LX-LXIII, LXX-LXXIII, LXXX-LXXXIII
    - "\\<L(V|X{1,3})I{0,3}\\>"
    # LXIV, LXIX, LXXIV, LXXIX, LXXXIV, LXXXIX
    - "\\<LX{1,3}I(V|X)\\>"
    # LXV-LXVIII, LXXV-LXXVIII, LXXXV-LXXXVIII
    - "\\<LX{1,3}VI{0,3}\\>"
    # "and others", optionally with one lowercase word in between.
    - "\\<and ([a-z]+ )?others\\>"

  # Literal strings to ignore.
  ignore:
    - "at head of title"
    - "colophon"
    - "date of publication not identified"
    - "place of publication not identified"
    - "publisher not identified"
    # The explicit Roman numeral entries below are disabled; the patterns in
    # `ignore_ptn` cover the same set. They are kept for reference.
    # - "II"
    # - "III"
    # - "IV"
    # - "IX"
    # - "LI"
    # - "LII"
    # - "LIII"
    # - "LIV"
    # - "LIX"
    # - "LV"
    # - "LVI"
    # - "LVII"
    # - "LVIII"
    # - "LX"
    # - "LXI"
    # - "LXII"
    # - "LXIII"
    # - "LXIV"
    # - "LXIX"
    # - "LXV"
    # - "LXVI"
    # - "LXVII"
    # - "LXVIII"
    # - "LXX"
    # - "LXXI"
    # - "LXXII"
    # - "LXXIII"
    # - "LXXIV"
    # - "LXXIX"
    # - "LXXV"
    # - "LXXVI"
    # - "LXXVII"
    # - "LXXVIII"
    # - "LXXX"
    # - "LXXXI"
    # - "LXXXII"
    # - "LXXXIII"
    # - "LXXXIV"
    # - "LXXXIX"
    # - "LXXXV"
    # - "LXXXVI"
    # - "LXXXVII"
    # - "LXXXVIII"
    # - "VI"
    # - "VII"
    # - "VIII"
    # - "XI"
    # - "XII"
    # - "XIII"
    # - "XIV"
    # - "XIX"
    # - "XL"
    # - "XLI"
    # - "XLII"
    # - "XLIII"
    # - "XLIV"
    # - "XLIX"
    # - "XLV"
    # - "XLVI"
    # - "XLVII"
    # - "XLVIII"
    # - "XV"
    # - "XVI"
    # - "XVII"
    # - "XVIII"
    # - "XX"
    # - "XXI"
    # - "XXII"
    # - "XXIII"
    # - "XXIV"
    # - "XXIX"
    # - "XXV"
    # - "XXVI"
    # - "XXVII"
    # - "XXVIII"
    # - "XXX"
    # - "XXXI"
    # - "XXXII"
    # - "XXXIII"
    # - "XXXIV"
    # - "XXXIX"
    # - "XXXV"
    # - "XXXVI"
    # - "XXXVII"
    # - "XXXVIII"
    - "and one other"
    - "et al."