PiledHigherAndDeeper: Fix for new website format

This commit is contained in:
Dirk Reiners 2015-01-16 12:06:17 -06:00
parent e25270c866
commit c6f0dd6117

View file

@@ -167,12 +167,12 @@ class Pixel(_BasicScraper):
 class PiledHigherAndDeeper(_BasicScraper):
-    url = 'http://www.phdcomics.com/comics/archive.php'
-    starter = bounceStarter(url, compile(r'<a href=(archive\.php\?comicid=\d+)><img height=52 width=49 src=images/next_button\.gif border=0 align=middle>'))
+    url = 'http://www.phdcomics.com/comics.php'
+    starter = bounceStarter(url, compile(r'<a href=(archive\.php\?comicid=\d+)>.*<img [^>]*next_button\.gif'))
     stripUrl = url + '?comicid=%s'
     firstStripUrl = stripUrl % '1'
-    imageSearch = compile(tagre("img", "src", r'(http://www\.phdcomics\.com/comics/archive/phd\d+s?\.\w{3,4})', quote=""))
-    prevSearch = compile(r'<a href=(archive\.php\?comicid=\d+)><img height=52 width=49 src=images/prev_button\.gif border=0 align=middle>')
+    imageSearch = compile(tagre("img", "src", r'(http://www\.phdcomics\.com/comics/archive/phd\d+s\d?\.\w{3,4})', quote=""))
+    prevSearch = compile(r'<a href=((comics/)?archive\.php\?comicid=\d+)>.*<img [^>]*prev_button\.gif')
     help = 'Index format: n (unpadded)'
     namer = queryNamer('comicid', usePageUrl=True)