parent
b25ae9e354
commit
c1234449f7
44
experimentations/get_mobilizon.py
Normal file
44
experimentations/get_mobilizon.py
Normal file
@ -0,0 +1,44 @@
|
||||
#!/usr/bin/python3
# coding: utf-8

# Experimentation script: fetch oncoming events from a Mobilizon group
# (attac63 on mobilizon.fr) and dump them to a local JSON file.

import os
import json
import sys

# getting the name of the directory
# where the this file is present.
current = os.path.dirname(os.path.realpath(__file__))

# Getting the parent directory name
# where the current directory is present.
parent = os.path.dirname(current)

# adding the parent directory to
# the sys.path so that src.agenda_culturel.* can be imported
# when running this script directly from experimentations/.
sys.path.append(parent)
sys.path.append(parent + "/src")

from src.agenda_culturel.import_tasks.downloader import *
from src.agenda_culturel.import_tasks.extractor import *
from src.agenda_culturel.import_tasks.importer import *
from src.agenda_culturel.import_tasks.custom_extractors import *


if __name__ == "__main__":

    u2e = URL2Events(SimpleDownloader(), mobilizon.CExtractor())
    url = "https://mobilizon.fr/@attac63/events?"
    # fixed: the scheme was mistyped as "htthttps://"
    url_human = "https://mobilizon.fr/@attac63/events"

    try:
        events = u2e.process(url, url_human, cache = "cache-attac63.html", default_values = {}, published = True)

        exportfile = "events-attac63.json"
        print("Saving events to file {}".format(exportfile))
        with open(exportfile, "w") as f:
            json.dump(events, f, indent=4, default=str)
    except Exception as e:
        print("Exception: " + str(e))
|
@ -160,6 +160,8 @@ def run_recurrent_import_internal(rimport, downloader, req_id):
|
||||
extractor = mille_formes.CExtractor()
|
||||
elif rimport.processor == RecurrentImport.PROCESSOR.AMISCERISES:
|
||||
extractor = amisdutempsdescerises.CExtractor()
|
||||
elif rimport.processor == RecurrentImport.PROCESSOR.MOBILIZON:
|
||||
extractor = mobilizon.CExtractor()
|
||||
else:
|
||||
extractor = None
|
||||
|
||||
|
182
src/agenda_culturel/import_tasks/custom_extractors/mobilizon.py
Normal file
182
src/agenda_culturel/import_tasks/custom_extractors/mobilizon.py
Normal file
@ -0,0 +1,182 @@
|
||||
from ..extractor import *
|
||||
import json
|
||||
import dateutil.parser
|
||||
from datetime import datetime, timezone
|
||||
import requests
|
||||
from urllib.parse import urlparse
|
||||
from bs4 import BeautifulSoup
|
||||
|
||||
import logging
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
# A class dedicated to getting events from a Mobilizon group
# by querying the GraphQL API of its instance
# (example: https://mobilizon.fr/@attac63/events)
class CExtractor(Extractor):

    def __init__(self):
        super().__init__()
        # this extractor queries the GraphQL API itself, so the
        # importer must not try to download the url beforehand
        self.no_downloader = True

    # Source code adapted from https://framagit.org/Marc-AntoineA/mobilizon-client-python
    def _request(self, body, data):
        # Run the GraphQL query `body` with variables `data` against
        # self._api_end_point and return the "data" part of the answer.
        # Raises Exception on HTTP errors and on GraphQL-level errors.
        headers = {}

        response = requests.post(url=self._api_end_point, json={ "query": body, "variables": data }, headers=headers)

        if response.status_code == 200:
            response_json = response.json()
            if 'errors' in response_json:
                raise Exception(f'Errors while requesting { body }. { str(response_json["errors"]) }')

            return response_json['data']
        else:
            raise Exception(f'Error while requesting. Status code: { response.status_code }')

    def _oncoming_events_number(self):
        # Return the total number of oncoming events of the group
        # (events starting after "now", in UTC).
        query = '''
        query($preferredUsername: String!, $afterDatetime: DateTime) {
            group(preferredUsername: $preferredUsername) {
                organizedEvents(afterDatetime: $afterDatetime) {
                    total,
                }
            }
        }
        '''
        today = datetime.now(timezone.utc).isoformat()
        data = {
            'preferredUsername': self._group_id,
            'afterDatetime': today
        }
        r = self._request(query, data)
        return r['group']['organizedEvents']['total']

    def _oncoming_events(self):
        # Return the list of oncoming events of the group, fetching
        # the paginated organizedEvents connection page by page.

        def _oncoming_events_page(page):
            # Fetch one page of oncoming events.
            query = '''
            query($preferredUsername: String!, $afterDatetime: DateTime, $page: Int) {
                group(preferredUsername: $preferredUsername) {
                    organizedEvents(afterDatetime: $afterDatetime, page: $page) {
                        elements {
                            id,
                            title,
                            url,
                            beginsOn,
                            endsOn,
                            options {
                                showStartTime,
                                showEndTime,
                                timezone
                            },
                            attributedTo {
                                avatar {
                                    url,
                                }
                                name,
                                preferredUsername,
                            },
                            description,
                            onlineAddress,
                            physicalAddress {
                                locality,
                                description,
                                region
                            },
                            tags {
                                title,
                                id,
                                slug
                            },
                            picture {
                                url
                            },
                            status
                        }
                    }
                }
            }
            '''

            today = datetime.now(timezone.utc).isoformat()
            data = {
                'preferredUsername': self._group_id,
                'afterDatetime': today,
                'page': page
            }
            r = self._request(query, data)
            return r['group']['organizedEvents']['elements']

        number_events = self._oncoming_events_number()

        events = []
        page = 1
        while len(events) < number_events:
            elements = _oncoming_events_page(page)
            if not elements:
                # guard against an infinite loop if the server returns
                # fewer events than announced by the "total" counter
                break
            events.extend(elements)
            page += 1
        return events

    def extract(
        self, content, url, url_human=None, default_values=None, published=False
    ):
        # Extract oncoming events of the Mobilizon group identified by
        # the actor id ("@name" or "@name@server") found in `url`.
        # `content` is unused since no_downloader is set.
        self.set_header(url)
        self.clear_events()

        if "@" in url:

            # TODO: quand on a
            # https://mobilizon.fr/@xr_clermont_ferrand@mobilizon.extinctionrebellion.fr/events
            # on doit retourner :
            # https://mobilizon.extinctionrebellion.fr/@xr_clermont_ferrand/events

            # split url to identify server url and actor id
            elems = [x for x in url.split('/') if len(x) > 0 and x[0] == "@"]
            if len(elems) == 1:
                params = elems[0].split('@')
                if len(params) == 2:
                    # "@group": the API lives on the url's own host
                    self._api_end_point = "https://" + urlparse(url).netloc + "/api"
                    self._group_id = params[1]
                else:
                    # "@group@server": the API lives on the remote server
                    self._api_end_point = "https://" + params[2] + "/api"
                    self._group_id = params[1]

                events = self._oncoming_events()

                for e in events:
                    title = e["title"]
                    event_url = e["url"]
                    # picture and physicalAddress are nullable in the
                    # Mobilizon GraphQL schema: guard against None
                    image = e["picture"]["url"] if e["picture"] else None
                    if e["physicalAddress"]:
                        location = e["physicalAddress"]["description"] + ', ' + e["physicalAddress"]["locality"]
                    else:
                        location = None
                    soup = BeautifulSoup(e["description"] or "", "html.parser")

                    # the description is HTML: keep only the text
                    description = soup.text
                    start = dateutil.parser.isoparse(e["beginsOn"])
                    end = dateutil.parser.isoparse(e["endsOn"])

                    start_day = start.date()
                    # times are only meaningful when the organizer chose
                    # to display them
                    start_time = start.time() if e["options"]["showStartTime"] else None
                    end_day = end.date()
                    end_time = end.time() if e["options"]["showEndTime"] else None

                    self.add_event(
                        default_values,
                        title,
                        None,
                        start_day,
                        location,
                        description,
                        [],
                        uuids=[event_url],
                        recurrences=None,
                        url_human=event_url,
                        start_time=start_time,
                        published=published,
                        image=image,
                        end_day=end_day,
                        end_time=end_time)

        return self.get_structure()
|
@ -20,6 +20,11 @@ class Extractor(ABC):
|
||||
self.events = []
|
||||
self.downloader = None
|
||||
self.has_2nd_method = False
|
||||
|
||||
# defined it to true in herited classes will
|
||||
# avoid the importer to use the downloader on the url
|
||||
# (used for extractors that are self-sufficient)
|
||||
self.no_downloader = False
|
||||
|
||||
# parameters used by the downloader to get the content
|
||||
self.referer = ""
|
||||
|
@ -0,0 +1,18 @@
|
||||
# Generated by Django 4.2.9 on 2025-02-12 14:17
|
||||
|
||||
from django.db import migrations, models
|
||||
|
||||
|
||||
class Migration(migrations.Migration):
    # Auto-generated migration: extends the choices of
    # RecurrentImport.processor with the new 'Mobilizon' processor.
    # Do not edit by hand beyond comments.

    dependencies = [
        ('agenda_culturel', '0146_alter_recurrentimport_processor'),
    ]

    operations = [
        # re-declare the full choices list (Django stores it verbatim);
        # only ('Mobilizon', 'Mobilizon') is new compared to 0146
        migrations.AlterField(
            model_name='recurrentimport',
            name='processor',
            field=models.CharField(choices=[('ical', 'ical'), ('icalnobusy', 'ical no busy'), ('icalnovc', 'ical no VC'), ('lacoope', 'lacoope.org'), ('lacomedie', 'la comédie'), ('lefotomat', 'le fotomat'), ('lapucealoreille', "la puce à l'oreille"), ('Plugin wordpress MEC', 'Plugin wordpress MEC'), ('Facebook events', "Événements d'une page FB"), ('Billetterie CF', 'Billetterie Clermont-Ferrand'), ('arachnee', 'Arachnée concert'), ('rio', 'Le Rio'), ('raymonde', 'La Raymonde'), ('apidae', 'Agenda apidae tourisme'), ('iguana', 'Agenda iguana (médiathèques)'), ('Mille formes', 'Mille formes'), ('Amis cerises', 'Les Amis du Temps des Cerises'), ('Mobilizon', 'Mobilizon')], default='ical', max_length=20, verbose_name='Processor'),
        ),
    ]
|
@ -2135,6 +2135,7 @@ class RecurrentImport(models.Model):
|
||||
IGUANA = 'iguana', _('Agenda iguana (médiathèques)')
|
||||
MILLEFORMES = 'Mille formes', _('Mille formes')
|
||||
AMISCERISES = 'Amis cerises', _('Les Amis du Temps des Cerises')
|
||||
MOBILIZON = 'Mobilizon', _('Mobilizon')
|
||||
|
||||
class DOWNLOADER(models.TextChoices):
|
||||
SIMPLE = "simple", _("simple")
|
||||
|
@ -45,4 +45,5 @@ django-cache-cleaner==0.1.0
|
||||
emoji==2.14.0
|
||||
django-honeypot==1.2.1
|
||||
django-autoslug==1.9.9
|
||||
django-debug-toolbar-template-profiler==2.1.0
|
||||
requests==2.32.3
|
Loading…
x
Reference in New Issue
Block a user