2016-03-31 21:13:54 +00:00
|
|
|
# -*- coding: utf-8 -*-
|
2016-10-28 22:21:41 +00:00
|
|
|
# Copyright (C) 2004-2008 Tristan Seligmann and Jonathan Jacobs
|
2014-01-05 15:50:57 +00:00
|
|
|
# Copyright (C) 2012-2014 Bastian Kleineidam
|
2017-02-12 19:29:57 +00:00
|
|
|
# Copyright (C) 2015-2017 Tobias Gruetzmacher
|
2012-11-21 20:57:26 +00:00
|
|
|
|
2016-03-31 21:13:54 +00:00
|
|
|
from __future__ import absolute_import, division, print_function
|
2012-11-26 06:13:32 +00:00
|
|
|
from re import compile
|
2012-06-20 19:58:13 +00:00
|
|
|
|
2016-10-31 05:57:47 +00:00
|
|
|
from ..scraper import _BasicScraper, _ParserScraper
|
2017-02-13 21:41:17 +00:00
|
|
|
from ..helpers import indirectStarter, xpath_class
|
2012-11-26 06:13:32 +00:00
|
|
|
from ..util import tagre
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
|
2012-12-02 17:35:06 +00:00
|
|
|
class VGCats(_BasicScraper):
|
2013-02-04 20:00:26 +00:00
|
|
|
url = 'http://www.vgcats.com/comics/'
|
|
|
|
stripUrl = url + '?strip_id=%s'
|
2013-04-10 21:57:09 +00:00
|
|
|
firstStripUrl = stripUrl % '0'
|
2012-12-02 17:35:06 +00:00
|
|
|
imageSearch = compile(tagre("img", "src", r'(images/\d{6}\.[^"]+)'))
|
|
|
|
prevSearch = compile(tagre("a", "href", r'(\?strip_id=\d+)') +
|
2016-03-31 21:13:54 +00:00
|
|
|
tagre("img", "src", r"back\.gif"))
|
2012-06-20 19:58:13 +00:00
|
|
|
help = 'Index format: n (unpadded)'
|
|
|
|
|
|
|
|
|
2012-12-02 17:35:06 +00:00
|
|
|
class VGCatsAdventure(VGCats):
|
2012-06-20 19:58:13 +00:00
|
|
|
name = 'VGCats/Adventure'
|
2013-02-04 20:00:26 +00:00
|
|
|
url = 'http://www.vgcats.com/ffxi/'
|
|
|
|
stripUrl = url + '?strip_id=%s'
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
|
2016-03-31 21:13:54 +00:00
|
|
|
class VGCatsSuper(VGCats):
|
|
|
|
name = 'VGCats/Super'
|
|
|
|
url = 'http://www.vgcats.com/super/'
|
|
|
|
stripUrl = url + '?strip_id=%s'
|
|
|
|
|
|
|
|
|
2012-12-08 20:30:51 +00:00
|
|
|
class VictimsOfTheSystem(_BasicScraper):
|
2013-02-04 20:00:26 +00:00
|
|
|
url = 'http://www.votscomic.com/'
|
|
|
|
stripUrl = url + '?id=%s.jpg'
|
2013-04-10 21:57:09 +00:00
|
|
|
firstStripUrl = stripUrl % '070103-002452'
|
2012-12-08 20:30:51 +00:00
|
|
|
imageSearch = compile(tagre("img", "src", r'(comicpro/strips/[^"]+)'))
|
2016-03-31 21:13:54 +00:00
|
|
|
prevSearch = compile(tagre("a", "href", r'(\?id=\d+-\d+\.jpg)') +
|
|
|
|
"Previous")
|
2012-12-08 20:30:51 +00:00
|
|
|
help = 'Index format: nnn-nnn'
|
|
|
|
|
|
|
|
|
2016-10-31 05:57:47 +00:00
|
|
|
class ViiviJaWagner(_ParserScraper):
|
2013-02-04 20:00:26 +00:00
|
|
|
url = 'http://www.hs.fi/viivijawagner/'
|
2017-02-12 19:29:57 +00:00
|
|
|
imageSearch = '//meta[@property="og:image"]/@content'
|
|
|
|
prevSearch = '//a[%s]' % xpath_class('prev')
|
|
|
|
latestSearch = '//div[%s]//a' % xpath_class('cartoon-content')
|
|
|
|
starter = indirectStarter
|
2015-04-18 20:45:13 +00:00
|
|
|
lang = 'fi'
|
2012-12-07 23:45:18 +00:00
|
|
|
|
2016-04-21 06:20:49 +00:00
|
|
|
def namer(self, image_url, page_url):
|
2017-02-12 19:29:57 +00:00
|
|
|
return page_url.rsplit('-', 1)[1].split('.')[0]
|
2019-07-12 07:46:45 +00:00
|
|
|
|
|
|
|
|
|
|
|
class VirmirWorld(_ParserScraper):
|
|
|
|
url = 'http://world.virmir.com/'
|
|
|
|
stripUrl = url + 'comic.php?story=%s&page=%s'
|
|
|
|
firstStripUrl = stripUrl % ('1', '1')
|
|
|
|
imageSearch = '//div[@class="comic"]//img'
|
|
|
|
prevSearch = '//a[contains(@class, "prev")]'
|
|
|
|
|
|
|
|
def getIndexStripUrl(self, index):
|
|
|
|
index = index.split('-')
|
|
|
|
return self.stripUrl % (index[0], index[1])
|