diff --git a/pythainlp/util/normalize.py b/pythainlp/util/normalize.py
index da1b9bc46..441182d21 100644
--- a/pythainlp/util/normalize.py
+++ b/pythainlp/util/normalize.py
@@ -38,7 +38,7 @@
     f"{follow_v}{lead_v}{above_v}{below_v}\u0e3a\u0e4c\u0e4d\u0e4e"
 )
 _NOREPEAT_PAIRS = list(
-    zip([f"({ch}[ ]*)+" for ch in _NOREPEAT_CHARS], _NOREPEAT_CHARS)
+    zip([f"({ch}[ ]*)+{ch}" for ch in _NOREPEAT_CHARS], _NOREPEAT_CHARS)
 )
 
 _RE_TONEMARKS = re.compile(f"[{tonemarks}]+")