From e1721db311d0a41f6ac9c6a3d4fe165b9fc333e7 Mon Sep 17 00:00:00 2001 From: Jean-Marie Favreau Date: Thu, 17 Oct 2024 10:48:37 +0200 Subject: [PATCH] =?UTF-8?q?On=20nettoie=20l'url=20facebook=20si=20elle=20c?= =?UTF-8?q?ontient=20le=20nom=20de=20l'=C3=A9v=C3=A9nement?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/agenda_culturel/import_tasks/extractor_facebook.py | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/src/agenda_culturel/import_tasks/extractor_facebook.py b/src/agenda_culturel/import_tasks/extractor_facebook.py index d74c1c2..c56167d 100644 --- a/src/agenda_culturel/import_tasks/extractor_facebook.py +++ b/src/agenda_culturel/import_tasks/extractor_facebook.py @@ -237,6 +237,12 @@ class FacebookEventExtractor(Extractor): if FacebookEventExtractor.is_known_url(url): u = urlparse(url) result = "https://www.facebook.com" + u.path + + # remove name in the url + match = re.match(r"(.*/events)/s/([a-zA-Z-][a-zA-Z-0-9]+)/([0-9/]*)", result) + if match: + result = match[1] + "/" + match[3] + if result[-1] == "/": return result[:-1] else: