From c77517b74176d6727ff848b6b007135102ef9be7 Mon Sep 17 00:00:00 2001
From: Bastien Le Querrec <blq@laquadrature.net>
Date: Mon, 6 Jan 2025 22:01:32 +0100
Subject: [PATCH] =?UTF-8?q?prefdpt:=20d=C3=A9tecte=20automatiquement=20la?=
 =?UTF-8?q?=20pr=C3=A9sence=20d'un=20lien=20vers=20un=20RAA?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 Attrap_pref06.py  | 1 -
 Attrap_pref10.py  | 1 -
 Attrap_prefdpt.py | 9 +++++++--
 3 files changed, 7 insertions(+), 4 deletions(-)

diff --git a/Attrap_pref06.py b/Attrap_pref06.py
index 68ad57a..382e21f 100644
--- a/Attrap_pref06.py
+++ b/Attrap_pref06.py
@@ -12,4 +12,3 @@ class Attrap_pref06(Attrap_prefdpt):
 
     # Configuration des widgets à analyser
     Attrap_prefdpt.grey_card['regex']['year'] = 'Année *([0-9]{4})'
-    Attrap_prefdpt.white_card['link_to_raa'] = True
diff --git a/Attrap_pref10.py b/Attrap_pref10.py
index 689748c..08d59ea 100644
--- a/Attrap_pref10.py
+++ b/Attrap_pref10.py
@@ -16,7 +16,6 @@ class Attrap_pref10(Attrap_prefdpt):
 
     # Configuration des widgets à analyser
     Attrap_prefdpt.grey_card['regex']['year'] = 'RAA *([0-9]{4})'
-    Attrap_prefdpt.white_card['link_to_raa'] = True
 
     # On ajoute un widget custom représentant les liens sur la page d'accueil
     Attrap_prefdpt.widgets.append(
diff --git a/Attrap_prefdpt.py b/Attrap_prefdpt.py
index 0e32a04..c83c8dd 100644
--- a/Attrap_prefdpt.py
+++ b/Attrap_prefdpt.py
@@ -20,6 +20,7 @@ class Attrap_prefdpt(Attrap):
             'title': 'div.fr-card.fr-card--sm.fr-card--grey.fr-enlarge-link div.fr-card__body div.fr-card__content h2.fr-card__title a'
         },
         'link_to_raa': False,
+        'autodetect_links_to_raa': True,
         'follow_link_on_unrecognised_date': True
     }
     white_card = {
@@ -33,6 +34,7 @@ class Attrap_prefdpt(Attrap):
             'pager': 'ul.fr-pagination__list li a.fr-pagination__link.fr-pagination__link--next.fr-pagination__link--lg-label'  # Chemin CSS du pager des cartes blanches
         },
         'link_to_raa': False,
+        'autodetect_links_to_raa': True,
         'follow_link_on_unrecognised_date': True
     }
 
@@ -52,11 +54,12 @@ class Attrap_prefdpt(Attrap):
     class DptWidget:
         """Une classe représentant un widget sur le site d'une préfecture de département."""
 
-        def __init__(self, name, regex=None, css_path=None, link_to_raa=False, follow_link_on_unrecognised_date=True):
+        def __init__(self, name, regex=None, css_path=None, link_to_raa=False, autodetect_links_to_raa=True, follow_link_on_unrecognised_date=True):
             self.name = name
             self.regex = regex
             self.css_path = css_path
             self.link_to_raa = link_to_raa
+            self.autodetect_links_to_raa = autodetect_links_to_raa
             self.follow_link_on_unrecognised_date = follow_link_on_unrecognised_date
 
         def has_css_path(self, key):
@@ -96,6 +99,7 @@ class Attrap_prefdpt(Attrap):
                     regex=self.grey_card['regex'],
                     css_path=self.grey_card['css_path'],
                     link_to_raa=self.grey_card['link_to_raa'],
+                    autodetect_links_to_raa=self.grey_card['autodetect_links_to_raa'],
                     follow_link_on_unrecognised_date=self.grey_card['follow_link_on_unrecognised_date']
                 )
             )
@@ -107,6 +111,7 @@ class Attrap_prefdpt(Attrap):
                     regex=self.white_card['regex'],
                     css_path=self.white_card['css_path'],
                     link_to_raa=self.white_card['link_to_raa'],
+                    autodetect_links_to_raa=self.white_card['autodetect_links_to_raa'],
                     follow_link_on_unrecognised_date=self.white_card['follow_link_on_unrecognised_date']
                 )
             )
@@ -171,7 +176,7 @@ class Attrap_prefdpt(Attrap):
                             date = datetime.datetime(9999, 1, 1)
 
                     # Si la configuration indique que les liens renvoient vers un RAA, on ajoute le lien à la liste des éléments
-                    if widget.link_to_raa:
+                    if widget.link_to_raa or (widget.autodetect_links_to_raa and card['url'].endswith('.pdf')):
                         if date.year == 9999:
                             date = None
                         raa = Attrap.RAA(card['url'], date, card['name'].strip(), timezone=self.timezone)
-- 
GitLab