# Tobias Gruetzmacher 42e43fa4e6 Read starter parameters from class.
# This allows specifying starters in a more declarative and dynamic way.
# 2016-04-12 23:11:39 +02:00
#
# 122 lines
# 4.4 KiB

# -*- coding: utf-8 -*-
# Copyright (C) 2004-2005 Tristan Seligmann and Jonathan Jacobs
# Copyright (C) 2012-2014 Bastian Kleineidam
# Copyright (C) 2015-2016 Tobias Gruetzmacher
from __future__ import absolute_import, division, print_function
from re import compile, escape
from ..scraper import _BasicScraper, _ParserScraper
from ..helpers import bounceStarter, indirectStarter
from ..util import tagre
from .common import _ComicControlScraper, _WordPressScraper, WP_LATEST_SEARCH
class Lackadaisy(_BasicScraper):
    """Scraper definition for Lackadaisy.

    Strips are addressed as ``comic.php?comicid=<n>`` relative to ``baseUrl``
    and saved under names produced by :meth:`namer`.
    """

    # NOTE(review): baseUrl is an empty string in this revision, so url and
    # stripUrl are relative paths; confirm the intended site address.
    baseUrl = ''
    url = baseUrl + 'comic.php'
    stripUrl = baseUrl + 'comic.php?comicid=%s'
    firstStripUrl = stripUrl % '1'
    imageSearch = compile(tagre("img", "src", r'(http://www\.lackadaisycats\.com/comic/[^"]*)'))
    prevSearch = compile(tagre("a", "href", r"(/comic\.php\?comicid=[0-9]+)") +
                         "< Previous")
    # The dot in ``comic.php`` is escaped so it only matches a literal ".",
    # in line with prevSearch above.
    # NOTE(review): the expression was cut off after the "+" in the source
    # (SyntaxError). The "Next >" label mirrors the "< Previous" label used by
    # prevSearch -- confirm against the page markup.
    nextSearch = compile(tagre("a", "href", r"(/comic\.php\?comicid=[0-9]+)") +
                         "Next >")
    help = 'Index format: n'
    starter = bounceStarter()

    # The first parameter is ``cls``, so the method is declared as a class
    # method; calls through an instance keep working unchanged.
    @classmethod
    def namer(cls, imageUrl, pageUrl):
        """Use comic id for filename.

        The id is the text after the last ``=`` in ``pageUrl``; the extension
        is the text after the last ``.`` in ``imageUrl``.

        Returns a string of the form ``lackadaisy_<id>.<ext>``.
        """
        num = pageUrl.rsplit('=', 1)[-1]
        ext = imageUrl.rsplit('.', 1)[-1]
        return 'lackadaisy_%s.%s' % (num, ext)
class Laiyu(_WordPressScraper):
    """Laiyu, defined on top of the shared WordPress scraper base."""

    # The first strip URL is the same value as the start URL.
    # NOTE(review): both are empty strings in this revision -- confirm the
    # intended site address.
    url = firstStripUrl = ''

    # Reuses the module-wide WordPress "latest" search imported from .common.
    latestSearch = WP_LATEST_SEARCH
    starter = indirectStarter()
class LasLindas(_BasicScraper):
    """Las Lindas; strips are addressed as ``comic/<stripname>/``."""

    help = 'Index format: stripname'
    # NOTE(review): presumably tells the scraper base to keep every image
    # match on a page -- confirm in ..scraper.
    multipleImagesPerStrip = True

    # NOTE(review): url is an empty string in this revision -- confirm the
    # intended site address.
    url = ''
    # Regex-escaped copy of url, spliced into the patterns below.
    rurl = escape(url)
    stripUrl = url + 'comic/%s/'
    imageSearch = compile(
        tagre(
            "img",
            "src",
            r'(%swp-content/uploads/[^"]+)' % rurl,
            after="attachment-full",
        )
    )
    prevSearch = compile(
        tagre(
            "a",
            "href",
            r'(%scomic/[^"]+)' % rurl,
            after="previous",
        )
    )
class LastNerdsOnEarth(_ParserScraper):
    """Last Nerds On Earth, located with XPath expressions."""

    # NOTE(review): url is an empty string in this revision -- confirm the
    # intended site address.
    url = ''

    # Third-from-last link inside the "comicnav" div.
    prevSearch = '//div[@id="comicnav"]/a[last()-2]'
    # Image wrapped in a link directly under the "content" div.
    imageSearch = '//div[@id="content"]/a/img'
class LeastICouldDo(_BasicScraper):
    """Scraper definition for Least I Could Do.

    Strips are addressed as ``comic/<yyyymmdd>`` relative to ``url``.
    """

    # NOTE(review): url is an empty string in this revision -- confirm the
    # intended site address.
    url = ''
    # Regex-escaped copy of url, spliced into the patterns below.
    rurl = escape(url)
    stripUrl = url + 'comic/%s'
    firstStripUrl = stripUrl % '20130109'
    imageSearch = compile(tagre("img", "src", r'(%swp-content/uploads/\d+/\d+/\d{8,9}\.\w{1,4})' % rurl))
    # FIXME(review): both tagre() calls below were cut off after ``% rurl,``
    # in the source (no closing parentheses), which is a SyntaxError. They are
    # closed here so the module parses again. The trailing comma suggests a
    # further argument was lost; as written the two patterns are identical, so
    # restore the missing argument(s) from version control before relying on
    # prevSearch and latestSearch to tell links apart.
    prevSearch = compile(tagre("a", "href", r'(%scomic/\d+/)' % rurl))
    latestSearch = compile(tagre("a", "href", r'(%scomic/\d+/)' % rurl))
    starter = indirectStarter()
    help = 'Index format: yyyymmdd'
class LetsSpeakEnglish(_ComicControlScraper):
    """Let's Speak English; only the start URL is set on top of the ComicControl base."""

    # NOTE(review): url is an empty string in this revision -- confirm the
    # intended site address.
    url = ''
class Lint(_BasicScraper):
    """Lint; strips are addressed as ``<yyyy/mm/dd/num-name>/``."""

    help = 'Index format: yyyy/mm/dd/num-name'

    # NOTE(review): url is an empty string in this revision -- confirm the
    # intended site address.
    url = ''
    # Regex-escaped copy of url, spliced into the image pattern.
    rurl = escape(url)
    stripUrl = url + '%s/'
    firstStripUrl = stripUrl % '2004/01/10/01102004'
    # Captures the src of an <img> whose path starts with "<url>comics/".
    imageSearch = compile(
        r'<img src="(%scomics/.+?)"' % rurl
    )
    # Captures the href of the rel="prev" link that follows a "| " separator.
    prevSearch = compile(
        r'\| <a href="([^"]+)" rel="prev">'
    )
class LinuxComFridayFunnies(_BasicScraper):
    """Linux.com Friday Funnies; strips are addressed by strip name."""

    help = 'Index format: stripname'

    # NOTE(review): url is an empty string in this revision -- confirm the
    # intended site address.
    url = ''
    stripUrl = url + '%s'
    firstStripUrl = stripUrl % 'the-road-to-japan'
    imageSearch = compile(
        tagre(
            "img",
            "src",
            r'(/news/friday-funnies/episode/[^"]+\?format=image[^"]+)',
        )
    )
    # The link pattern must be followed directly by the text "Previous".
    prevSearch = compile(
        tagre("a", "href", r'(/news/friday-funnies/[^"]+)')
        + "Previous"
    )
class LittleGamers(_BasicScraper):
    """Little Gamers; strips are addressed as ``<yyyy/mm/dd/name>/``."""

    help = 'Index format: yyyy/mm/dd/name'

    # NOTE(review): url is an empty string in this revision -- confirm the
    # intended site address.
    url = ''
    stripUrl = url + '%s/'
    firstStripUrl = stripUrl % '2000/12/01/99'
    # Image URLs are matched on the host without "www."; the previous-link
    # pattern below uses the "www." host.
    imageSearch = compile(
        tagre(
            "img",
            "src",
            r'(http://little-gamers\.com/comics/[^"]+)',
        )
    )
    prevSearch = compile(
        tagre(
            "a",
            "href",
            r'(http://www\.little-gamers\.com/[^"]+)',
            before="comic-nav-prev-link",
        )
    )
class LoadingArtist(_ParserScraper):
    """Loading Artist, located with XPath expressions."""

    # NOTE(review): url is an empty string in this revision -- confirm the
    # intended site address.
    url = ''

    # Link whose space-separated class list contains the token "prev".
    prevSearch = "//a[contains(concat(' ', @class, ' '), ' prev ')]"
    # Any image nested inside a div whose class is exactly "comic".
    imageSearch = '//div[@class="comic"]//img'
class LookingForGroup(_ParserScraper):
    """Looking For Group; strips are addressed as ``page/<nnn>/``."""

    help = 'Index format: nnn'
    # The search strings below are written as CSS selectors.
    # NOTE(review): presumably this flag makes the parser base treat them as
    # CSS and not XPath -- confirm in ..scraper.
    css = True

    # NOTE(review): url is an empty string in this revision -- confirm the
    # intended site address.
    url = ''
    stripUrl = url + 'page/%s/'
    firstStripUrl = stripUrl % '1'

    imageSearch = '#comic img'
    prevSearch = '#comic-left > a'
    # Second link directly inside the "header-dropdown-comic-lfg" element.
    latestSearch = '#header-dropdown-comic-lfg > a:nth-of-type(2)'
    starter = indirectStarter()