---
# Shared ignore list, grouped by conversion direction (`roman_to_script`,
# `script_to_roman`). Under each direction, `ignore` holds literal strings
# and `ignore_ptn` holds regular-expression patterns.
# NOTE(review): presumably the consumer leaves matching text untouched;
# confirm how the patterns are anchored and which regex engine is used.
general:
  name: Common ignore list.

roman_to_script:
  ignore:
    - " "
    - "at head of title"
    - "colophon"
    - "date of publication not identified"
    - "place of publication not identified"
    - "publisher not identified"
    # NOTE There is ambiguity about ignoring these words. Note that the
    # single-character Roman numerals are not included on purpose.
    # Ideally the source editors should use the dedicated
    # U+2160 to U+216F (uppercase Roman numerals) and/or
    # U+2170 to U+217F (lowercase Roman numerals) ranges to avoid this
    # ambiguity.
    - "and one other"
    - "et al."
  ignore_ptn:
    - "and ([a-z0-9]+ )?others"
    # Roman numerals built from I, V, X and L. Lower bounds are written
    # explicitly (`{0,3}` rather than `{,3}`) because not every regex
    # engine accepts an omitted minimum.
    # NOTE(review): with zero trailing I's, `LI{0,3}`,
    # `(V|X{1,3})I{0,3}` and `X{1,3}I{0,3}` can also match a bare L, V
    # or X, which seems at odds with the note above about
    # single-character numerals; confirm the intent.
    - "I{2,3}"
    - "I(V|X)"
    - "LI{0,3}"
    - "LI?(V|X)"
    - "L(V|X{1,3})I{0,3}"
    - "LX{1,3}I?V"
    - "LX{1,3}VI{0,3}"
    - "(V|X{1,3})I{0,3}"
    - "X{1,3}I{0,3}"
    - "X{1,3}I(V|X)"
    - "X{1,3}VI{0,3}"

script_to_roman:
  ignore:
    - " "