diff --git a/src/agenda_culturel/import_tasks/custom_extractors/lefotomat.py b/src/agenda_culturel/import_tasks/custom_extractors/lefotomat.py index 2b4ca73..a9951c9 100644 --- a/src/agenda_culturel/import_tasks/custom_extractors/lefotomat.py +++ b/src/agenda_culturel/import_tasks/custom_extractors/lefotomat.py @@ -1,4 +1,5 @@ from bs4 import BeautifulSoup +import re from ..extractor import Extractor from ..twosteps_extractor import TwoStepsExtractor @@ -51,10 +52,17 @@ class CExtractor(TwoStepsExtractor): else: image = None desc = soup.select("head meta[name=description]")[0]["content"] - start_day = Extractor.parse_french_date(desc.split("-")[0]) - start_time = Extractor.parse_french_time(desc.split("-")[1]) - end_time = Extractor.parse_french_time(desc.split("-")[2]) - end_day = Extractor.guess_end_day(start_day, start_time, end_time) + res = re.match("(.*202[5-9])[ -]*([0-9h:]+)[ -]*([0-9h:]*)", desc) + if res: + start_day = Extractor.parse_french_date(res[1]) + start_time = Extractor.parse_french_time(res[2]) + end_time = Extractor.parse_french_time(res[3]) + end_day = Extractor.guess_end_day(start_day, start_time, end_time) + else: + start_day = None + start_time = None + end_time = None + end_day = None location = self.nom_lieu descriptions = soup.select("div.vce-col-content")