Fix some comics: build the skipped page URLs in shouldSkipUrl from stripUrl instead of hard-coding them.

This commit is contained in:
Bastian Kleineidam 2013-03-08 06:47:00 +01:00
parent 4c344765ff
commit b368f125bc
4 changed files with 9 additions and 8 deletions

View file

@ -179,9 +179,9 @@ class AstronomyPOTD(_BasicScraper):
def shouldSkipUrl(self, url):
"""Skip pages without images."""
return url in (
'http://antwrp.gsfc.nasa.gov/apod/ap130217.html', # video
'http://antwrp.gsfc.nasa.gov/apod/ap130218.html', # video
'http://antwrp.gsfc.nasa.gov/apod/ap130226.html', # video
self.stripUrl % '130217', # video
self.stripUrl % '130218', # video
self.stripUrl % '130226', # video
)
@classmethod

View file

@ -45,8 +45,8 @@ class CaribbeanBlue(_BasicScraper):
def shouldSkipUrl(self, url):
"""Skip pages without images."""
return url in (
"http://cblue.katbox.net/comic/filler-stall-them/",
"http://cblue.katbox.net/comic/filler-kimi-figurine-now-available/",
self.stripUrl % "filler-stall-them",
self.stripUrl % "filler-kimi-figurine-now-available",
)
@ -219,7 +219,7 @@ class CyanideAndHappiness(_BasicScraper):
def shouldSkipUrl(self, url):
"""Skip pages without images."""
return url == "http://www.explosm.net/comics/3082/"
return url in (self.stripUrl % "3082",)
@classmethod
def namer(cls, imageUrl, pageUrl):

View file

@ -101,7 +101,7 @@ class ToonHole(_BasicScraper):
help = 'Index format: yyyy/mm/stripname'
def shouldSkipUrl(self, url):
return url in ("http://www.toonhole.com/2013/03/if-game-of-thrones-was-animated/",)
return url in (self.stripUrl % "2013/03/if-game-of-thrones-was-animated",)
# XXX disallowed by robots.txt

View file

@ -54,6 +54,7 @@ class Zwarwald(_BasicScraper):
prevSearch = compile(tagre("a", "href", r'(http://www\.zwarwald\.de/index\.php/page/\d+/)') +
tagre("img", "src", r'http://zwarwald\.de/images/prev\.jpg', quote="'"))
help = 'Index format: number'
waitSeconds = 1
def shouldSkipUrl(self, url):
return url in ("http://www.zwarwald.de/index.php/page/112/",)
return url in (self.stripUrl % "112",)