Amélioration parse du Wix de la puce à l'oreille

This commit is contained in:
Jean-Marie Favreau 2025-04-12 08:33:35 +02:00
parent 516430f9f4
commit b186001132

View File

@@ -31,9 +31,12 @@ class CExtractor(TwoStepsExtractor):
title = soup.select("h2")[0].get_text()
start_day = Extractor.parse_french_date(
soup.select("h2")[1].get_text()
) # pas parfait, mais bordel que ce site est mal construit
# pas parfait, mais bordel que ce site est mal construit
for h2 in range(1, 4):
print(soup.select("h2")[h2].get_text())
start_day = Extractor.parse_french_date(soup.select("h2")[h2].get_text())
if start_day is not None:
break
spans = soup.select("div[data-testid=richTextElement] span")
start_time = None