diff --git a/src/agenda_culturel/import_tasks/extractor.py b/src/agenda_culturel/import_tasks/extractor.py index cd0e081..b86e701 100644 --- a/src/agenda_culturel/import_tasks/extractor.py +++ b/src/agenda_culturel/import_tasks/extractor.py @@ -72,7 +72,7 @@ class Extractor(ABC): def parse_french_date(text, default_year=None, default_year_by_proximity=None): # format NomJour Numero Mois Année m = re.search( - "[a-zA-ZéÉûÛ:.]+[ ]*([0-9]+)[er]*[ ]*([a-zA-ZéÉûÛ:.]+)[ ]*([0-9]+)", + "[a-zA-ZéÉûÛ:.]+[  ]*([0-9]+)[er]*[  ]*([a-zA-ZéÉûÛ:.]+)[  ]*([0-9]+)", text, ) if m: @@ -81,7 +81,7 @@ class Extractor(ABC): year = m.group(3) else: # format Numero Mois Annee - m = re.search("([0-9]+)[er]*[ ]*([a-zA-ZéÉûÛ:.]+)[ ]*([0-9]+)", text) + m = re.search("([0-9]+)[er]*[  ]*([a-zA-ZéÉûÛ:.]+)[  ]*([0-9]+)", text) if m: day = m.group(1) month = Extractor.guess_month(m.group(2)) @@ -95,7 +95,7 @@ class Extractor(ABC): year = m.group(3) else: # format Numero Mois Annee - m = re.search("([0-9]+)[er]*[ ]*([a-zA-ZéÉûÛ:.]+)", text) + m = re.search("([0-9]+)[er]*[  ]*([a-zA-ZéÉûÛ:.]+)", text) if m: day = m.group(1) month = Extractor.guess_month(m.group(2))