fixing KatzenfutterGeleespritzer
This commit is contained in:
parent
8a245e1d10
commit
3edaa97fb9
2 changed files with 4 additions and 16 deletions
|
@@ -7,7 +7,9 @@ def add(name, url, firstUrl=None, lang=None):
|
||||||
name=name,
|
name=name,
|
||||||
url=url,
|
url=url,
|
||||||
imageSearch='//div[@id="comic"]//img',
|
imageSearch='//div[@id="comic"]//img',
|
||||||
prevSearch=['//a[contains(text(), " Prev")]', "//a[contains(concat(' ', @class, ' '), ' navi-prev ')]"]
|
prevSearch=['//a[contains(text(), " Prev")]',
|
||||||
|
"//a[contains(concat(' ', @class, ' '), ' navi-prev ')]",
|
||||||
|
"//a[contains(concat(' ', @class, ' '), ' navi-prev-in ')]"]
|
||||||
)
|
)
|
||||||
if lang:
|
if lang:
|
||||||
attrs['lang'] = lang
|
attrs['lang'] = lang
|
||||||
|
@@ -19,6 +21,7 @@ def add(name, url, firstUrl=None, lang=None):
|
||||||
add('BloodBound', 'http://bloodboundcomic.com/', 'comic/06112006/')
|
add('BloodBound', 'http://bloodboundcomic.com/', 'comic/06112006/')
|
||||||
add('BroodHollow', 'http://broodhollow.chainsawsuit.com/', 'page/2012/10/06/book-1-curious-little-thing')
|
add('BroodHollow', 'http://broodhollow.chainsawsuit.com/', 'page/2012/10/06/book-1-curious-little-thing')
|
||||||
add('CourtingDisaster', 'http://www.courting-disaster.com/', 'comic/courting-disaster-17/')
|
add('CourtingDisaster', 'http://www.courting-disaster.com/', 'comic/courting-disaster-17/')
|
||||||
|
add('KatzenfutterGeleespritzer', 'http://www.katzenfuttergeleespritzer.de/', 'comics/gert-grendil/', 'de')
|
||||||
add('OnTheEdge', 'http://ontheedgecomics.com/', 'comic/ote0001/')
|
add('OnTheEdge', 'http://ontheedgecomics.com/', 'comic/ote0001/')
|
||||||
add('PandyLand', 'http://pandyland.net/', '1/')
|
add('PandyLand', 'http://pandyland.net/', '1/')
|
||||||
add('Hipsters', 'http://www.hipsters-comic.com/', 'comic/hip01/')
|
add('Hipsters', 'http://www.hipsters-comic.com/', 'comic/hip01/')
|
||||||
|
|
|
@@ -8,21 +8,6 @@ from ..util import tagre
|
||||||
from ..helpers import indirectStarter
|
from ..helpers import indirectStarter
|
||||||
|
|
||||||
|
|
||||||
class KatzenfutterGeleespritzer(_BasicScraper):
|
|
||||||
url = 'http://www.katzenfuttergeleespritzer.de/'
|
|
||||||
rurl = escape(url)
|
|
||||||
stripUrl = url + 'comics/%s/'
|
|
||||||
firstStripUrl = stripUrl % 'dont-drink-and-drive'
|
|
||||||
imageSearch = (
|
|
||||||
compile(tagre("img", "src", r'(%swp-content/uploads/\d+/\d+/\d+-\d+-\d+[^"]+)' % rurl)),
|
|
||||||
compile(tagre("img", "src", r'(%swp-content/uploads/\d+/\d+/mmai_404[^"]+)' % rurl)),
|
|
||||||
)
|
|
||||||
# XXX disallowed by robots.txt
|
|
||||||
#prevSearch = compile(tagre("a", "href", r'(%scomics/[^"]+)' % rurl, after="navi-prev"))
|
|
||||||
#help = 'Index format: stripname'
|
|
||||||
lang = 'de'
|
|
||||||
|
|
||||||
|
|
||||||
class KevinAndKell(_BasicScraper):
|
class KevinAndKell(_BasicScraper):
|
||||||
url = 'http://www.kevinandkell.com/'
|
url = 'http://www.kevinandkell.com/'
|
||||||
stripUrl = url + '%s/kk%s%s.html'
|
stripUrl = url + '%s/kk%s%s.html'
|
||||||
|
|
Loading…
Reference in a new issue