Fix MonsieurLeChien using archive.org (fixes #240)

This commit is contained in:
Tobias Gruetzmacher 2023-07-18 22:49:49 +02:00
parent 4b98223dad
commit 89db5f31a6
No known key found for this signature in database

View file

@@ -165,14 +165,15 @@ class MonkeyUser(_ParserScraper):
return data.xpath('//div[d:class("video-container")]', namespaces=NS) return data.xpath('//div[d:class("video-container")]', namespaces=NS)
class MonsieurLeChien(_BasicScraper): class MonsieurLeChien(ParserScraper):
url = 'http://www.monsieur-le-chien.fr/' url = ('https://web.archive.org/web/20210311002403/'
'http://www.monsieur-le-chien.fr/')
stripUrl = url + 'index.php?planche=%s' stripUrl = url + 'index.php?planche=%s'
firstStripUrl = stripUrl % '2' firstStripUrl = stripUrl % '2'
lang = 'fr' lang = 'fr'
imageSearch = compile(tagre("img", "src", r'(i/planches/[^"]+)')) imageSearch = '//img[contains(@src,"i/planches/")]'
prevSearch = compile(tagre("a", "href", r'([^"]+)') + prevSearch = '//a[img[contains(@src,"i/precedent.gif")]]'
tagre("img", "src", "i/precedent.gif")) endOfLife = True
help = 'Index format: n' help = 'Index format: n'