Fix some comics (AstronomyPOTD, Blip, BoxerHockey, CaribbeanBlue, CyanideAndHappiness).

This commit is contained in:
Bastian Kleineidam 2013-02-18 20:38:44 +01:00
parent 1700229ba1
commit 96edb60e01
3 changed files with 16 additions and 4 deletions

View file

@ -145,7 +145,7 @@ class AstronomyPOTD(_BasicScraper):
stripUrl = 'http://antwrp.gsfc.nasa.gov/apod/ap%s.html' stripUrl = 'http://antwrp.gsfc.nasa.gov/apod/ap%s.html'
imageSearch = compile(r'<a href="(image/\d{4}/[^"]+)"') imageSearch = compile(r'<a href="(image/\d{4}/[^"]+)"')
multipleImagesPerStrip = True multipleImagesPerStrip = True
noImageurls = set(['http://antwrp.gsfc.nasa.gov/apod/ap130218.html']) noImageUrls = set(['http://antwrp.gsfc.nasa.gov/apod/ap130218.html'])
prevSearch = compile(r'<a href="(ap\d{6}\.html)">&lt;</a>') prevSearch = compile(r'<a href="(ap\d{6}\.html)">&lt;</a>')
help = 'Index format: yymmdd' help = 'Index format: yymmdd'

View file

@ -56,6 +56,11 @@ class Blip(_BasicScraper):
prevSearch = compile(r'First.+?"(index.php\?strip_id=.+?)".+?prev') prevSearch = compile(r'First.+?"(index.php\?strip_id=.+?)".+?prev')
help = 'Index format: n' help = 'Index format: n'
@classmethod
def prevUrlModifier(cls, prevUrl):
    """Rewrite the host of the previous-strip URL for Blip.

    Replaces every occurrence of ``www.blipcomic.com`` in *prevUrl* with
    ``blipcomic.com``.

    Returns the rewritten URL, or ``None`` when *prevUrl* is ``None`` or
    empty (there is nothing to rewrite).
    """
    # NOTE(review): presumably the site's "previous" links use the www host
    # while the strips are reachable on the bare host -- confirm.
    if not prevUrl:
        # Explicit None keeps the original fall-through result for falsy input.
        return None
    return prevUrl.replace("www.blipcomic.com", "blipcomic.com")
class BlueCrashKit(_BasicScraper): class BlueCrashKit(_BasicScraper):
url = 'http://www.bluecrashkit.com/cheese/' url = 'http://www.bluecrashkit.com/cheese/'
@ -122,6 +127,11 @@ class BoxerHockey(_BasicScraper):
r'[^>]+Previous') r'[^>]+Previous')
help = 'Index format: n (unpadded)' help = 'Index format: n (unpadded)'
@classmethod
def prevUrlModifier(cls, prevUrl):
    """Rewrite the host of the previous-strip URL for BoxerHockey.

    Replaces every occurrence of ``www.boxerhockey.com`` in *prevUrl* with
    ``boxerhockey.fireball20xl.com``.

    Returns the rewritten URL, or ``None`` when *prevUrl* is ``None`` or
    empty (there is nothing to rewrite).
    """
    # NOTE(review): presumably the "previous" links still point at the old
    # www host while the comic is served from the fireball20xl host -- confirm.
    if not prevUrl:
        # Explicit None keeps the original fall-through result for falsy input.
        return None
    return prevUrl.replace("www.boxerhockey.com", "boxerhockey.fireball20xl.com")
class BroodHollow(_BasicScraper): class BroodHollow(_BasicScraper):
url = 'http://broodhollow.chainsawsuit.com/' url = 'http://broodhollow.chainsawsuit.com/'

View file

@ -29,9 +29,10 @@ class CaseyAndAndy(_BasicScraper):
class CaribbeanBlue(_BasicScraper): class CaribbeanBlue(_BasicScraper):
url = 'http://cblue.katbox.net/' url = 'http://cblue.katbox.net/'
stripUrl = url + 'archive/%s' stripUrl = url + 'comic/%s/'
imageSearch = compile(tagre("img", "src", r'(http://cblue\.katbox\.net/wp-content/webcomic/cblue/[^"]+)')) #http://cblue.katbox.net/wp-content/uploads/cb270en.png?6949c1
prevSearch = compile(tagre("a", "href", r'(http://cblue\.katbox\.net/archive/[^"]+)', after="previous")) imageSearch = compile(tagre("img", "src", r'(http://cblue\.katbox\.net/wp-content/uploads/cb[^"]+)'))
prevSearch = compile(tagre("a", "href", r'(http://cblue\.katbox\.net/comic/[^"]+)', after="previous"))
help = 'Index format: nnn-stripname' help = 'Index format: nnn-stripname'
@ -200,6 +201,7 @@ class CyanideAndHappiness(_BasicScraper):
stripUrl = url + '%s/' stripUrl = url + '%s/'
imageSearch = compile(tagre("img", "src", r'(http://(?:www\.)?explosm\.net/db/files/[^"]+)', before="a daily webcomic")) imageSearch = compile(tagre("img", "src", r'(http://(?:www\.)?explosm\.net/db/files/[^"]+)', before="a daily webcomic"))
prevSearch = compile(tagre("a", "href", r'(/comics/\d+/)', before="prev")) prevSearch = compile(tagre("a", "href", r'(/comics/\d+/)', before="prev"))
noImageUrls = set(["http://www.explosm.net/comics/3082/"])
help = 'Index format: n (unpadded)' help = 'Index format: n (unpadded)'
@classmethod @classmethod