diff --git a/RAAspotter_pref976.py b/RAAspotter_pref976.py index d0cdc69ee144c38cd342fd3c93bd1715610b4cce..39b28b6ce8b8c6597b1192601b8ccea7257ff0c2 100644 --- a/RAAspotter_pref976.py +++ b/RAAspotter_pref976.py @@ -62,7 +62,8 @@ class RAAspotter_pref976(RAAspotter): # Pour chaque mois, on cherche les pages des RAA for month_page in month_pages: - for page_to_parse in self.find_raa_card(month_page['url']): + year = RAAspotter.guess_date(month_page['name'], '(.*)').year + for page_to_parse in self.find_raa_card(month_page['url'], year): sub_pages_to_parse.append(page_to_parse) # On parse les pages contenant des RAA @@ -72,7 +73,7 @@ class RAAspotter_pref976(RAAspotter): self.parse_raa(raa_elements, keywords.split(',')) self.mailer() - def find_raa_card(self, page): + def find_raa_card(self, page, year=None): pages = [] card_pages = self.get_sub_pages_with_pager( page, @@ -83,6 +84,8 @@ class RAAspotter_pref976(RAAspotter): for card_page in card_pages: # On filtre les pages de RAA ne correspondant pas à la période analysée guessed_date = RAAspotter.guess_date(card_page['name'], 'n°[ 0-9]* du ([0-9]*(?:er)? [a-zéû]* [0-9]*)') + if year: + guessed_date = guessed_date.replace(year = year) if guessed_date >= self.not_before: pages.append(card_page['url']) return pages