From d3fbe9a1e6ac3b7a6a87f866fe2ce33e7513fa90 Mon Sep 17 00:00:00 2001 From: Bastien Le Querrec <blq@laquadrature.net> Date: Sun, 24 Mar 2024 01:51:29 +0100 Subject: [PATCH] =?UTF-8?q?pref976:=20ignore=20l'ann=C3=A9e=20des=20dates?= =?UTF-8?q?=20estim=C3=A9es?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit L'année des dates estimées peut être fausse en janvier. --- RAAspotter_pref976.py | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/RAAspotter_pref976.py b/RAAspotter_pref976.py index d0cdc69..39b28b6 100644 --- a/RAAspotter_pref976.py +++ b/RAAspotter_pref976.py @@ -62,7 +62,8 @@ class RAAspotter_pref976(RAAspotter): # Pour chaque mois, on cherche les pages des RAA for month_page in month_pages: - for page_to_parse in self.find_raa_card(month_page['url']): + year = RAAspotter.guess_date(month_page['name'], '(.*)').year + for page_to_parse in self.find_raa_card(month_page['url'], year): sub_pages_to_parse.append(page_to_parse) # On parse les pages contenant des RAA @@ -72,7 +73,7 @@ class RAAspotter_pref976(RAAspotter): self.parse_raa(raa_elements, keywords.split(',')) self.mailer() - def find_raa_card(self, page): + def find_raa_card(self, page, year=None): pages = [] card_pages = self.get_sub_pages_with_pager( page, @@ -83,6 +84,8 @@ class RAAspotter_pref976(RAAspotter): for card_page in card_pages: # On filtre les pages de RAA ne correspondant pas à la période analysée guessed_date = RAAspotter.guess_date(card_page['name'], 'n°[ 0-9]* du ([0-9]*(?:er)? [a-zéû]* [0-9]*)') + if year: + guessed_date = guessed_date.replace(year = year) if guessed_date >= self.not_before: pages.append(card_page['url']) return pages -- GitLab