diff --git a/nameparser/config/__init__.py b/nameparser/config/__init__.py index 4f1e4f2..4eaf15b 100644 --- a/nameparser/config/__init__.py +++ b/nameparser/config/__init__.py @@ -231,7 +231,7 @@ def __init__(self, self.first_name_titles = SetManager(first_name_titles) self.conjunctions = SetManager(conjunctions) self.capitalization_exceptions = TupleManager(capitalization_exceptions) - self.regexes = TupleManager(regexes) + self.regexes = TupleManager([tpl[:2] for tpl in REGEXES]) self._pst = None @property diff --git a/nameparser/config/regexes.py b/nameparser/config/regexes.py index bd4b320..9be2f1e 100644 --- a/nameparser/config/regexes.py +++ b/nameparser/config/regexes.py @@ -18,20 +18,39 @@ '[\u2600-\u26FF\u2700-\u27BF])+', re.UNICODE) -REGEXES = set([ +REGEXES = [ ("spaces", re.compile(r"\s+", re.U)), ("word", re.compile(r"(\w|\.)+", re.U)), ("mac", re.compile(r'^(ma?c)(\w{2,})', re.I | re.U)), ("initial", re.compile(r'^(\w\.|[A-Z])?$', re.U)), - ("quoted_word", re.compile(r'(?