Remove ScurryAndCover, too much JavaScript.
This commit is contained in:
parent
47e2502ec7
commit
69e6318f87
1 changed file with 0 additions and 32 deletions
|
@@ -144,38 +144,6 @@ class Science(_BasicScraper):
|
||||||
help = 'Index format: stripname'
|
help = 'Index format: stripname'
|
||||||
|
|
||||||
|
|
||||||
class ScurryAndCover(_ParserScraper):
    """Scraper for the comic hosted at http://scurry.ink.

    Navigation links are located with XPath like any other parser-based
    scraper. The image URL, however, is assembled from a ``fileRoot``
    variable assigned inside an inline JavaScript block of the page.
    """

    url = 'http://scurry.ink'
    prevSearch = '//div[@id="prevpage"]/..'
    nextSearch = '//div[@id="nextpage"]/..'
    # Sentinel, not a real XPath: fetchUrls() compares the requested search
    # against this value to tell image lookups from navigation lookups.
    imageSearch = 'MARKER'

    def fetchUrls(self, url, data, urlsearch):
        """Return the URLs matching ``urlsearch`` on the parsed page ``data``.

        Any search other than ``imageSearch`` is delegated to the parent
        class. For ``imageSearch`` the inline scripts in ``<body>`` are
        scanned for ``var fileRoot = '...'`` and a one-element list with the
        image URL built from the first hit is returned.

        Raises:
            ValueError: if no inline script assigns ``fileRoot``.
        """
        if urlsearch != self.imageSearch:
            return super(ScurryAndCover, self).fetchUrls(url, data, urlsearch)

        # Get the javascript elements and parse the variable value.
        regex = compile("var fileRoot = '([^']+)")
        for script in data.xpath('//body/script[@type="text/javascript"]'):
            # A script element without inline text has text None; searching
            # None would raise TypeError, so fall back to an empty string.
            match = regex.search(script.text or '')
            if match:
                return [self.url + '/images/pages/' + match.group(1) +
                        '-xsmall.png']

        # NOTE(review): starter() below treats ValueError from fetchUrl as
        # "nothing found", so the same signal is used here instead of
        # silently returning None - confirm against the base class contract.
        raise ValueError('No fileRoot variable found at URL %s.' % url)

    def starter(self):
        """Go forward as far as possible, then start.

        Follows ``nextSearch`` links from ``self.url`` until the lookup fails
        with ValueError, and returns the last URL that was reached.
        """
        url = self.url
        while True:
            data = self.getPage(url)
            try:
                url = self.fetchUrl(url, data, self.nextSearch)
            except ValueError:
                # No further "next" link: url still holds the last page.
                break
        return url
|
|
||||||
|
|
||||||
|
|
||||||
class SequentialArt(_BasicScraper):
|
class SequentialArt(_BasicScraper):
|
||||||
url = 'http://www.collectedcurios.com/sequentialart.php'
|
url = 'http://www.collectedcurios.com/sequentialart.php'
|
||||||
stripUrl = url + '?s=%s'
|
stripUrl = url + '?s=%s'
|
||||||
|
|
Loading…
Reference in a new issue