Updated GirlGenius to new markup
The Girl Genius (GG) markup has changed, so I fixed the prevSearch regex to find the "previous" button on the redesigned page. I also set multipleImagesPerStrip to True, since quite a few comics have multiple images that were being discarded.
This commit is contained in:
parent
94090da813
commit
236b840363
1 changed file with 3 additions and 3 deletions
|
@@ -111,11 +111,11 @@ class GirlGenius(_BasicScraper):
|
||||||
stripUrl = url + '?date=%s'
|
stripUrl = url + '?date=%s'
|
||||||
firstStripUrl = stripUrl % '20021104'
|
firstStripUrl = stripUrl % '20021104'
|
||||||
imageSearch = compile(tagre("img", "src", r"(%sggmain/strips/[^']*)" % rurl, quote="'"))
|
imageSearch = compile(tagre("img", "src", r"(%sggmain/strips/[^']*)" % rurl, quote="'"))
|
||||||
prevSearch = compile(tagre("a", "href", r"(%s[^']+)" % rurl, quote="'") +
|
prevSearch = compile(tagre("a", "id", "topprev", quote="\"",
|
||||||
tagre("img", "alt", "The Previous Comic", quote="'"))
|
before=r"(%s[^\"']+)" % rurl))
|
||||||
|
multipleImagesPerStrip = True
|
||||||
help = 'Index format: yyyymmdd'
|
help = 'Index format: yyyymmdd'
|
||||||
|
|
||||||
|
|
||||||
class GirlsWithSlingshots(_BasicScraper):
|
class GirlsWithSlingshots(_BasicScraper):
|
||||||
url = 'http://www.girlswithslingshots.com/'
|
url = 'http://www.girlswithslingshots.com/'
|
||||||
rurl = escape(url)
|
rurl = escape(url)
|
||||||
|
|
Loading…
Reference in a new issue