From 1c514631a4e2204e5911123ad766c681516ae868 Mon Sep 17 00:00:00 2001 From: Jean-Marie Favreau Date: Sat, 18 Nov 2023 19:31:49 +0100 Subject: [PATCH] =?UTF-8?q?URL=20facebook=20simplifi=C3=A9e=20des=20=C3=A9?= =?UTF-8?q?l=C3=A9ments=20de=20navigation?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/agenda_culturel/extractors.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/src/agenda_culturel/extractors.py b/src/agenda_culturel/extractors.py index 1f0e9ef..4a02380 100644 --- a/src/agenda_culturel/extractors.py +++ b/src/agenda_culturel/extractors.py @@ -194,6 +194,8 @@ class ExtractorFacebook(Extractor): image = self.get_element("image") local_image = None if image is None else Extractor.download_media(image) + u = urlparse(url) + unique_url = u.scheme + "://" + u.netloc + u.path return Event(title=self.get_element("name"), status=Event.STATUS.DRAFT, @@ -206,7 +208,7 @@ class ExtractorFacebook(Extractor): local_image=local_image, image=self.get_element("image"), image_alt=self.get_element("image_alt"), - reference_urls=[url]) + reference_urls=[unique_url]) def process_page(txt, url):