diff --git a/authors-tools/v1/first-name/gender.py b/authors-tools/v1/first-name/gender.py index c93026b..244c974 100644 --- a/authors-tools/v1/first-name/gender.py +++ b/authors-tools/v1/first-name/gender.py @@ -9,13 +9,15 @@ def detector(name,my_dict) : + name = name.replace("'","") if re.match(r"^([A-Z][. '-]+){2,}[A-Z]*",name) or re.match(r"\b[A-Z]+\b\.?",name) : return "name error" else : name = unidecode(name.lower()) name = name.replace(".","") name = name.replace("- ","-") - name = re.split("[\s-]+", name) + name = name.replace("'","") + name = re.split("[,\s-]+", name) ######################## POUR LES PRENOMS SIMPLE. EXEMPLE : BOB ########################################################### if len(name) == 1 : @@ -74,7 +76,8 @@ def main(): - with open('./v1/first-name/name_gender.pickle', 'rb') as handle: + # with open('./v1/first-name/name_gender.pickle', 'rb') as handle: + with open('name_gender.pickle', 'rb') as handle: my_dict = pickle.load(handle) for line in sys.stdin: