---
# _ignore_base.yml
#
# Common ignore list, grouped by direction (`roman_to_script`,
# `script_to_roman`). `ignore` entries are plain strings; `ignore_ptn`
# entries are regular-expression patterns.
# NOTE(review): how the consumer applies these entries (anchoring, case
# sensitivity, literal vs. regex handling of `ignore`) is not visible from
# this file -- confirm against the loader.

general:
  name: Common ignore list.

roman_to_script:
  ignore:
    - " "
    - "at head of title"
    - "colophon"
    - "date of publication not identified"
    - "place of publication not identified"
    - "publisher not identified"
    - "and one other"
    - "et al."
  ignore_ptn:
    - "and ([a-z0-9]+ )?others"
    # Multi-letter Roman numerals built from I, V, X and L.
    #
    # NOTE There is ambiguity about ignoring these words. Note that the
    # single-character Roman numerals are not included on purpose.
    # Ideally the source editors should use the dedicated
    # U+2160 to U+216F (uppercase Roman numerals) and/or
    # U+2170 to U+217F (lowercase Roman numerals) ranges to avoid this
    # ambiguity.
    #
    # Quantifiers spell out the lower bound (`{0,3}`); the `{,3}`
    # shorthand is only understood by some regex engines.
    #
    # NOTE(review): because the trailing `I{0,3}` may be empty, some of
    # these patterns (`LI{0,3}`, `(V|X{1,3})I{0,3}`, `X{1,3}I{0,3}`) can
    # also match a lone L, V or X, which seems at odds with the note
    # above -- confirm whether that is intended.
    - "I{2,3}"
    - "I(V|X)"
    - "LI{0,3}"
    - "LI?(V|X)"
    - "L(V|X{1,3})I{0,3}"
    - "LX{1,3}I?V"
    - "LX{1,3}VI{0,3}"
    - "(V|X{1,3})I{0,3}"
    - "X{1,3}I{0,3}"
    - "X{1,3}I(V|X)"
    - "X{1,3}VI{0,3}"

script_to_roman:
  ignore:
    - " "