# -*- coding: utf-8 -*-
# Copyright (C) 2004-2005 Tristan Seligmann and Jonathan Jacobs
# Copyright (C) 2012-2014 Bastian Kleineidam
# Copyright (C) 2015-2016 Tobias Gruetzmacher

from __future__ import absolute_import, division, print_function

from re import compile, escape

from ..scraper import _BasicScraper, _ParserScraper
from ..helpers import bounceStarter, indirectStarter
from ..util import tagre
from .common import _ComicControlScraper, _WordPressScraper, WP_LATEST_SEARCH


# Scraper definition for the comic hosted at lackadaisy.foxprints.com.
class Lackadaisy(_BasicScraper):
    baseUrl = 'http://lackadaisy.foxprints.com/'
    url = baseUrl + 'comic.php'
    stripUrl = baseUrl + 'comic.php?comicid=%s'
    firstStripUrl = stripUrl % '1'
    imageSearch = compile(tagre(
        "img", "src", r'(http://www\.lackadaisycats\.com/comic/[^"]*)'))
    prevSearch = compile(
        tagre("a", "href", r"(/comic\.php\?comicid=[0-9]+)") + "< Previous")
    # The dot in "comic.php" is escaped so that it only matches a literal
    # '.', consistent with prevSearch above.
    nextSearch = compile(
        tagre("a", "href", r"(/comic\.php\?comicid=[0-9]+)") + "Next")
    help = 'Index format: n'
    # Start-page lookup is delegated to bounceStarter (from ..helpers).
    starter = bounceStarter

    @classmethod
    def namer(cls, imageUrl, pageUrl):
        """Use comic id for filename.

        The comic id is whatever follows the last '=' in pageUrl and the
        extension is whatever follows the last '.' in imageUrl; the result
        has the form 'lackadaisy_<id>.<extension>'.
        """
        num = pageUrl.rsplit('=', 1)[-1]
        ext = imageUrl.rsplit('.', 1)[-1]
        return 'lackadaisy_%s.%s' % (num, ext)


# Scraper definition for the comic hosted at www.flowerlarkstudios.com.
class Laiyu(_WordPressScraper):
    url = 'http://www.flowerlarkstudios.com/comic/preliminary-concepts/welcome/'
    # The configured URL doubles as the first strip.
    firstStripUrl = url
    latestSearch = WP_LATEST_SEARCH
    # Start-page lookup is delegated to indirectStarter (from ..helpers).
    starter = indirectStarter


# Scraper definition for the comic hosted at laslindas.katbox.net.
class LasLindas(_BasicScraper):
    url = 'http://laslindas.katbox.net/'
    # Regex-escaped copy of url for embedding in the patterns below.
    rurl = escape(url)
    stripUrl = url + 'comic/%s/'
    imageSearch = compile(tagre(
        "img", "src", r'(%swp-content/uploads/[^"]+)' % rurl,
        after="attachment-full"))
    multipleImagesPerStrip = True
    prevSearch = compile(tagre(
        "a", "href", r'(%scomic/[^"]+)' % rurl, after="previous"))
    help = 'Index format: stripname'


# Scraper definition for the comic hosted at www.lastnerdsonearth.com.
class LastNerdsOnEarth(_ParserScraper):
    url = 'http://www.lastnerdsonearth.com/latest/'
    # Both searches are XPath expressions.
    imageSearch = '//div[@id="content"]/a/img'
    prevSearch = '//div[@id="comicnav"]/a[last()-2]'


# Scraper definition for the comic hosted at www.leasticoulddo.com.
class LeastICouldDo(_BasicScraper):
    url = 'http://www.leasticoulddo.com/'
    # Regex-escaped copy of url for embedding in the patterns below.
    rurl = escape(url)
    stripUrl = url + 'comic/%s'
    firstStripUrl = stripUrl % '20130109'
    # Image file names are 8-9 digits followed by a 1-4 character extension.
    imageSearch = compile(tagre(
        "img", "src",
        r'(%swp-content/uploads/\d+/\d+/\d{8,9}\.\w{1,4})' % rurl))
    prevSearch = compile(tagre(
        "a", "href", r'(%scomic/\d+/)' % rurl, after="Previous"))
    latestSearch = compile(tagre(
        "a", "href", r'(%scomic/\d+/)' % rurl, after="feature-comic"))
    # Start-page lookup is delegated to indirectStarter (from ..helpers).
    starter = indirectStarter
    help = 'Index format: yyyymmdd'


# Scraper definition for the comic hosted at www.marycagle.com; everything
# except the URL comes from _ComicControlScraper.
class LetsSpeakEnglish(_ComicControlScraper):
    url = 'http://www.marycagle.com'


# Scraper definition for the comic hosted at www.little-gamers.com.
class LittleGamers(_BasicScraper):
    url = 'http://www.little-gamers.com/'
    stripUrl = url + '%s/'
    firstStripUrl = stripUrl % '2000/12/01/99'
    # Note: image URLs are matched on the host without the "www." prefix.
    imageSearch = compile(tagre(
        "img", "src", r'(http://little-gamers\.com/comics/[^"]+)'))
    prevSearch = compile(tagre(
        "a", "href", r'(http://www\.little-gamers\.com/[^"]+)',
        before="comic-nav-prev-link"))
    help = 'Index format: yyyy/mm/dd/name'


# Scraper definition for the comic hosted at www.loadingartist.com.
class LoadingArtist(_ParserScraper):
    url = 'http://www.loadingartist.com/comic/new-update/'
    imageSearch = '//div[@class="comic"]//img'
    # Selects <a> elements whose space-separated class list contains the
    # token "prev".
    prevSearch = "//a[contains(concat(' ', @class, ' '), ' prev ')]"


# Scraper definition for the comic hosted at www.lfgcomic.com.
class LookingForGroup(_ParserScraper):
    url = 'http://www.lfgcomic.com/'
    stripUrl = url + 'page/%s/'
    firstStripUrl = stripUrl % '1'
    # The searches below are written as CSS selectors.
    css = True
    imageSearch = '#comic img'
    prevSearch = '#comic-left > a'
    latestSearch = '#header-dropdown-comic-lfg > a:nth-of-type(2)'
    # Start-page lookup is delegated to indirectStarter (from ..helpers).
    starter = indirectStarter
    help = 'Index format: nnn'