|
@@ -24,7 +24,7 @@ class Context:
|
|
|
return self._src
|
|
|
|
|
|
@src.setter
|
|
|
- def src(self):
|
|
|
+ def src(self, _):
|
|
|
raise NotImplementedError("Atribute is read-only.")
|
|
|
|
|
|
@src.deleter
|
|
@@ -110,6 +110,12 @@ def transliterate(src, lang, t_dir="s2r", capitalize=False, options={}):
|
|
|
if _run_hook("post_config", ctx, langsec_hooks) == BREAK:
|
|
|
return getattr(ctx, "dest", ""), ctx.warnings
|
|
|
|
|
|
+ if "normalize" in ctx.langsec:
|
|
|
+ _normalize_src(ctx)
|
|
|
+
|
|
|
+ if _run_hook("post_normalize", ctx, langsec_hooks) == BREAK:
|
|
|
+ return getattr(ctx, "dest", ""), ctx.warnings
|
|
|
+
|
|
|
# Loop through source characters. The increment of each loop depends on
|
|
|
# the length of the token that eventually matches.
|
|
|
ignore_list = langsec.get("ignore", []) # Only present in R2S
|
|
@@ -280,6 +286,12 @@ def transliterate(src, lang, t_dir="s2r", capitalize=False, options={}):
|
|
|
return ctx.dest, ctx.warnings
|
|
|
|
|
|
|
|
|
+def _normalize_src(ctx):
|
|
|
+ for nk, nv in ctx.langsec.get("normalize", {}).items():
|
|
|
+ ctx._src = ctx.src.replace(nk, nv)
|
|
|
+ logger.debug(f"Normalized source: {ctx.src}")
|
|
|
+
|
|
|
+
|
|
|
def _run_hook(hname, ctx, hooks):
|
|
|
ret = None
|
|
|
for hook_def in hooks.get(hname, []):
|