PiledHigherAndDeeper: Fix for new website format
This commit is contained in:
parent
e25270c866
commit
c6f0dd6117
1 changed file with 4 additions and 4 deletions
|
@@ -167,12 +167,12 @@ class Pixel(_BasicScraper):
|
||||||
|
|
||||||
|
|
||||||
class PiledHigherAndDeeper(_BasicScraper):
|
class PiledHigherAndDeeper(_BasicScraper):
|
||||||
url = 'http://www.phdcomics.com/comics/archive.php'
|
url = 'http://www.phdcomics.com/comics.php'
|
||||||
starter = bounceStarter(url, compile(r'<a href=(archive\.php\?comicid=\d+)><img height=52 width=49 src=images/next_button\.gif border=0 align=middle>'))
|
starter = bounceStarter(url, compile(r'<a href=(archive\.php\?comicid=\d+)>.*<img [^>]*next_button\.gif'))
|
||||||
stripUrl = url + '?comicid=%s'
|
stripUrl = url + '?comicid=%s'
|
||||||
firstStripUrl = stripUrl % '1'
|
firstStripUrl = stripUrl % '1'
|
||||||
imageSearch = compile(tagre("img", "src", r'(http://www\.phdcomics\.com/comics/archive/phd\d+s?\.\w{3,4})', quote=""))
|
imageSearch = compile(tagre("img", "src", r'(http://www\.phdcomics\.com/comics/archive/phd\d+s\d?\.\w{3,4})', quote=""))
|
||||||
prevSearch = compile(r'<a href=(archive\.php\?comicid=\d+)><img height=52 width=49 src=images/prev_button\.gif border=0 align=middle>')
|
prevSearch = compile(r'<a href=((comics/)?archive\.php\?comicid=\d+)>.*<img [^>]*prev_button\.gif')
|
||||||
help = 'Index format: n (unpadded)'
|
help = 'Index format: n (unpadded)'
|
||||||
namer = queryNamer('comicid', usePageUrl=True)
|
namer = queryNamer('comicid', usePageUrl=True)
|
||||||
|
|
||||||
|
|
Loading…
Reference in a new issue