derek73 · aikimark · Mar 20, 2021 · Mar 21, 2021 · Mar 22, 2021 · Mar 25, 2021
diff --git a/nameparser/config/__init__.py b/nameparser/config/__init__.py
@@ -231,7 +231,7 @@ def __init__(self,
         self.first_name_titles   = SetManager(first_name_titles)
         self.conjunctions        = SetManager(conjunctions)
         self.capitalization_exceptions = TupleManager(capitalization_exceptions)
-        self.regexes             = TupleManager(regexes)
+        self.regexes             = TupleManager([tpl[:2] for tpl in REGEXES])
         self._pst = None
 
     @property

diff --git a/nameparser/config/regexes.py b/nameparser/config/regexes.py
@@ -18,20 +18,37 @@
         '[\u2600-\u26FF\u2700-\u27BF])+', 
         re.UNICODE)
 
-REGEXES = set([
+REGEXES = [
     ("spaces", re.compile(r"\s+", re.U)),
     ("word", re.compile(r"(\w|\.)+", re.U)),
     ("mac", re.compile(r'^(ma?c)(\w{2,})', re.I | re.U)),
     ("initial", re.compile(r'^(\w\.|[A-Z])?$', re.U)),
-    ("quoted_word", re.compile(r'(?<!\w)\'([^\s]*?)\'(?!\w)', re.U)),
-    ("double_quotes", re.compile(r'\"(.*?)\"', re.U)),
-    ("parenthesis", re.compile(r'\((.*?)\)', re.U)),
+    ("double_apostrophe_ASCII", re.compile(r"(?!\w)''(\w[^']*?)''(?!\w)", re.U), 'nickname'),
+    ("smart_quote", re.compile(r"(?!\w)“(\w[^”]*?)”(?!\w)", re.U), 'nickname'),
+    ("smart_single_quote", re.compile(r"(?!\w)‘(\w[^’]*?)’(?!\w)", re.U), 'nickname'),
+    ("grave_accent", re.compile(r'(?!\w)`(\w[^`]*?)`(?!\w)', re.U), 'nickname'),
+    ("grave_acute", re.compile(r'(?!\w)`(\w[^´]*?)´(?!\w)', re.U), 'nickname'),
+    ("apostrophe_ASCII", re.compile(r"(?!\w)'(\w[^']*?)'(?!\w)", re.U), 'nickname'),
+    ("quote_ASCII", re.compile(r'(?!\w)"(\w[^"]*?)"(?!\w)', re.U), 'nickname'),
+    ("parenthesis", re.compile(r'(?!\w)\((\w[^)]*?)\)(?!\w)', re.U), 'nickname'),
     ("roman_numeral", re.compile(r'^(X|IX|IV|V?I{0,3})$', re.I | re.U)),
     ("no_vowels",re.compile(r'^[^aeyiuo]+$', re.I | re.U)),
     ("period_not_at_end",re.compile(r'.*\..+$', re.I | re.U)),
     ("emoji",re_emoji),
     ("phd", re.compile(r'\s(ph\.?\s+d\.?)', re.I | re.U)),
-])
+]
 """
 All regular expressions used by the parser are precompiled and stored in the config.
+
+REGEX tuple positions are:
+    [0] - name of the pattern, used in code as named attribute
+    [1] - compiled pattern
+    [2] - (optional) label/tag of the pattern, used in code for 
+          filtering patterns
+
+All nickname patterns should follow this template:
+    (?!\w)leading_delim(\w[^trailing_delim]*?)trailing_delim(?!\w)
+
+Nicknames are assumed to be delimited by non-word characters.
+
 """
diff --git a/nameparser/config/testREGEXES.py b/nameparser/config/testREGEXES.py
@@ -0,0 +1,49 @@
+# -*- coding: utf-8 -*-
+"""
+Created on Thu Mar 18 04:54:12 2021
+
+@author: New User
+"""
+import re
+
+class TupleManager(dict):
+    '''
+    A dictionary with dot.notation access. Subclass of ``dict``. Makes the tuple constants 
+    more friendly.
+    '''
+    def __getattr__(self, attr):
+        return self.get(attr)
+    __setattr__= dict.__setitem__
+    __delattr__= dict.__delitem__
+
+    def __getstate__(self):
+        return dict(self)
+
+    def __setstate__(self, state):
+        self.__init__(state)
+
+    def __reduce__(self):
+        return (TupleManager, (), self.__getstate__())
+
+REGEXES = [
+    ("spaces", re.compile(r"\s+", re.U)),
+    ("word", re.compile(r"(\w|\.)+", re.U)),
+    ("mac", re.compile(r'^(ma?c)(\w{2,})', re.I | re.U)),
+    ("initial", re.compile(r'^(\w\.|[A-Z])?$', re.U)),
+    ("quoted_word", re.compile(r'(?<!\w)\'([^\s]*?)\'(?!\w)', re.U), 'nickname'),
+    ("double_quotes", re.compile(r'\"(.*?)\"', re.U), 'nickname'),
+    ("parenthesis", re.compile(r'\((.*?)\)', re.U), 'nickname'),
+    #("quoted_word", re.compile(r'(?<!\w)\'([^\s]*?)\'(?!\w)', re.U)),
+    #("double_quotes", re.compile(r'\"(.*?)\"', re.U)),
+    #("parenthesis", re.compile(r'\((.*?)\)', re.U)),
+    ("roman_numeral", re.compile(r'^(X|IX|IV|V?I{0,3})$', re.I | re.U)),
+    ("no_vowels",re.compile(r'^[^aeyiuo]+$', re.I | re.U)),
+    ("period_not_at_end",re.compile(r'.*\..+$', re.I | re.U)),
+    ("phd", re.compile(r'\s(ph\.?\s+d\.?)', re.I | re.U)),
+]
+
+r = TupleManager(tpl[:2] for tpl in REGEXES)
+nn_TM = TupleManager(tpl[:2] for tpl in REGEXES if tpl[-1] == 'nickname')
+nn = [tpl[1] for tpl in REGEXES if tpl[-1] == 'nickname']
+
+rgx = re.compile(r"(?!\w)‘([^’]*?)’(?!\w)", re.U)
diff --git a/nameparser/parser.py b/nameparser/parser.py
@@ -12,6 +12,7 @@
 from nameparser.config import CONSTANTS
 from nameparser.config import Constants
 from nameparser.config import DEFAULT_ENCODING
+from nameparser.config.regexes import REGEXES
 
 ENCODING = 'utf-8'
 
@@ -70,7 +71,7 @@ class HumanName(object):
     _members = ['title','first','middle','last','suffix','nickname']
     unparsable = True
     _full_name = ''
-
+    
     def __init__(self, full_name="", constants=CONSTANTS, encoding=DEFAULT_ENCODING,
                 string_format=None):
         self.C = constants
@@ -79,7 +80,17 @@ def __init__(self, full_name="", constants=CONSTANTS, encoding=DEFAULT_ENCODING,
 
         self.encoding = encoding
         self.string_format = string_format or self.C.string_format
+        self._nickname_regexes = [tpl[1] 
+                                  for tpl in REGEXES
+                                  if isinstance(tpl[-1], str)
+                                  and 'nickname' in tpl[-1]
+                                 ]
         # full_name setter triggers the parse
+        #========================================================
+        #IMPORTANT NOTE:
+        #  The following statement must be the last one in the 
+        #  __init__ function
+        #========================================================
         self.full_name = full_name
 
     def __iter__(self):
@@ -419,18 +430,14 @@ def parse_nicknames(self):
         white space to allow for quotes in names like O'Connor and Kawai'ae'a.
         Double quotes and parenthesis can span white space.
 
-        Loops through 3 :py:data:`~nameparser.config.regexes.REGEXES`;
-        `quoted_word`, `double_quotes` and `parenthesis`.
+        Loops through every :py:data:`~nameparser.config.regexes.REGEXES`
+        entry whose label/tag contains "nickname".
         """
 
-        re_quoted_word = self.C.regexes.quoted_word
-        re_double_quotes = self.C.regexes.double_quotes
-        re_parenthesis = self.C.regexes.parenthesis
-
-        for _re in (re_quoted_word, re_double_quotes, re_parenthesis):
+        for _re in self._nickname_regexes:
             if _re.search(self._full_name):
                 self.nickname_list += [x for x in _re.findall(self._full_name)]
-                self._full_name = _re.sub('', self._full_name)
+                self._full_name = _re.sub(' ', self._full_name)
 
     def squash_emoji(self):
         """