dosage/dosagelib/plugins/v.py

# SPDX-License-Identifier: MIT
# Copyright (C) 2004-2008 Tristan Seligmann and Jonathan Jacobs
# Copyright (C) 2012-2014 Bastian Kleineidam
# Copyright (C) 2015-2020 Tobias Gruetzmacher
# Copyright (C) 2019-2020 Daniel Ring
from ..scraper import ParserScraper, _ParserScraper
from ..helpers import bounceStarter, indirectStarter


class Vexxarr(_ParserScraper):
    """Scraper definition for the comic served from www.vexxarr.com."""

    # Site root; both the entry page and the archive pages are built on it.
    baseUrl = 'http://www.vexxarr.com/'
    url = '{}Index.php'.format(baseUrl)

    # Archive pages are selected through the ``seldate`` query value.
    stripUrl = '{}archive.php?seldate=%s'.format(baseUrl)
    firstStripUrl = stripUrl % ('010105',)

    # Start-page strategy imported from ..helpers.
    starter = bounceStarter

    # XPath expressions: the strip image, and the anchors wrapping the
    # "next" / "previous" navigation images.
    imageSearch = '//p/img'
    nextSearch = '//a[./img[contains(@src, "next")]]'
    prevSearch = '//a[./img[contains(@src, "previous")]]'

    def namer(self, imageUrl, pageUrl):
        """Derive the file name from the value after the last '=' in pageUrl.

        The value is cut into three two-character groups and re-ordered as
        ``20<third>-<first>-<second>``. ``imageUrl`` is not consulted.
        NOTE(review): the value looks like an MMDDYY date, which would make
        the result YYYY-MM-DD -- confirm against the site.
        """
        seldate = pageUrl.rpartition('=')[2]
        first, second, third = seldate[0:2], seldate[2:4], seldate[4:6]
        return '-'.join(('20' + third, first, second))


class VGCats(_ParserScraper):
    """Scraper definition for the comic served from www.vgcats.com."""

    url = 'https://www.vgcats.com/comics/'

    # A single strip is addressed through the ``strip_id`` query value.
    stripUrl = '{}?strip_id=%s'.format(url)
    firstStripUrl = stripUrl % ('0',)
    help = 'Index format: n (unpadded)'

    # XPath expressions: an <img> directly inside a table cell whose src
    # contains "images/", and the anchor wrapping the "back." image.
    imageSearch = '//td/img[contains(@src, "images/")]'
    prevSearch = '//a[img[contains(@src, "back.")]]'


class VickiFox(_ParserScraper):
    """Scraper definition for the comic served from www.vickifox.com."""

    url = 'http://www.vickifox.com/comic/strip'

    # A single strip is addressed through the ``id`` query value.
    stripUrl = '{}?id=%s'.format(url)
    firstStripUrl = stripUrl % ('001',)

    imageSearch = '//img[contains(@src, "comic/")]'
    # Selects the ``value`` attribute of the button with id "btnPrev"; the
    # result is an id to substitute into stripUrl, not a ready-made link.
    prevSearch = '//button[@id="btnPrev"]/@value'

    def getPrevUrl(self, url, data):
        """Return the strip URL built from the "btnPrev" button value.

        The page at ``url`` is loaded with ``self.getPage`` and queried with
        ``prevSearch``; the first match is substituted into ``stripUrl``.
        Raises IndexError when the query matches nothing.
        """
        # NOTE(review): ``data`` is unused and the page is requested again
        # here; presumably ``data`` already holds the parsed page for
        # ``url`` -- confirm against the caller before reusing it.
        page = self.getPage(url)
        matches = page.xpath(self.prevSearch)
        return self.stripUrl % matches[0]


class ViiviJaWagner(_ParserScraper):
    """Scraper definition for the comic served from www.hs.fi."""

    url = 'http://www.hs.fi/viivijawagner/'
    lang = 'fi'

    # Start-page strategy imported from ..helpers.
    # NOTE(review): latestSearch is presumably what indirectStarter uses to
    # locate the newest strip from ``url`` -- confirm in ..helpers.
    starter = indirectStarter
    latestSearch = '//div[d:class("cartoon-content")]//a'

    # XPath expressions: the og:image meta content for the strip image and
    # the anchor matched by d:class("prev") for navigation.
    imageSearch = '//meta[@property="og:image"]/@content'
    prevSearch = '//a[d:class("prev")]'

    def namer(self, image_url, page_url):
        """Name the strip after the last dash-separated piece of page_url.

        Takes the text following the final '-' and drops everything from the
        first '.' onward. ``image_url`` is not consulted. Raises IndexError
        when ``page_url`` contains no '-'.
        """
        after_dash = page_url.rsplit('-', 1)[1]
        return after_dash.partition('.')[0]


class VirmirWorld(_ParserScraper):
    """Scraper definition for the comic served from world.virmir.com."""

    url = 'http://world.virmir.com/'

    # Strip pages take two query values: ``story`` and ``page``.
    stripUrl = '{}comic.php?story=%s&page=%s'.format(url)
    firstStripUrl = stripUrl % ('1', '1')

    # XPath expressions: images inside the "comic" div, and anchors whose
    # class attribute contains "prev".
    imageSearch = '//div[@class="comic"]//img'
    prevSearch = '//a[contains(@class, "prev")]'

    def getIndexStripUrl(self, index):
        """Build a strip URL from an index written as ``<story>-<page>``.

        Only the first two dash-separated pieces are used. Raises IndexError
        when ``index`` contains no '-'.
        """
        pieces = index.split('-')
        story, page = pieces[0], pieces[1]
        return self.stripUrl % (story, page)


class Vreakerz(ParserScraper):
    """Scraper definition for the comic served from vreakerz.angrykitten.nl."""

    url = 'http://vreakerz.angrykitten.nl/'

    # A single strip is addressed by the trailing path segment.
    stripUrl = '{}stories/read/%s'.format(url)
    firstStripUrl = stripUrl % ('1',)

    # XPath expressions: images whose src contains "storypages", and the
    # anchor with class "btn-prior" for navigation.
    imageSearch = '//img[contains(@src, "storypages")]'
    prevSearch = '//a[@class="btn-prior"]'
Update file headers The default encoding for source files is UTF-8 since Python 3, so we can drop all encoding headers. While we are at it, just replace them with SPDX headers. 2020-04-18 11:45:44 +00:00			`# SPDX-License-Identifier: MIT`
Fixup copyright years. 2016-10-28 22:21:41 +00:00			`# Copyright (C) 2004-2008 Tristan Seligmann and Jonathan Jacobs`
Updated copyright. 2014-01-05 15:50:57 +00:00			`# Copyright (C) 2012-2014 Bastian Kleineidam`
Add self to authors list, update copyright headers 2020-01-13 06:34:05 +00:00			`# Copyright (C) 2015-2020 Tobias Gruetzmacher`
			`# Copyright (C) 2019-2020 Daniel Ring`
Add Vreakerz 2022-12-26 09:28:47 +00:00			`from ..scraper import ParserScraper, _ParserScraper`
Replace xpath_class with custom xpath function 2020-07-31 20:56:30 +00:00			`from ..helpers import bounceStarter, indirectStarter`
Initial commit to Github. 2012-06-20 19:58:13 +00:00

Add Vexxarr 2019-07-15 09:33:32 +00:00			`class Vexxarr(_ParserScraper):`
			`baseUrl = 'http://www.vexxarr.com/'`
			`url = baseUrl + 'Index.php'`
			`stripUrl = baseUrl + 'archive.php?seldate=%s'`
			`firstStripUrl = stripUrl % '010105'`
			`imageSearch = '//p/img'`
			`prevSearch = '//a[./img[contains(@src, "previous")]]'`
			`nextSearch = '//a[./img[contains(@src, "next")]]'`
			`starter = bounceStarter`

			`def namer(self, imageUrl, pageUrl):`
			`page = pageUrl.rsplit('=', 1)[-1]`
			`return '20%s-%s-%s' % (page[4:6], page[0:2], page[2:4])`


Fix VGCats & switch to HTTPS 2020-09-30 19:37:29 +00:00			`class VGCats(_ParserScraper):`
			`url = 'https://www.vgcats.com/comics/'`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`stripUrl = url + '?strip_id=%s'`
Add firstStripUrls. 2013-04-10 21:57:09 +00:00			`firstStripUrl = stripUrl % '0'`
Fix VGCats, VGCats/Adventure, VGCats/Super 2020-12-02 07:40:42 +00:00			`imageSearch = '//td/img[contains(@src, "images/")]'`
Fix VGCats & switch to HTTPS 2020-09-30 19:37:29 +00:00			`prevSearch = '//a[img[contains(@src, "back.")]]'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`help = 'Index format: n (unpadded)'`


Add VickiFox 2019-12-01 01:37:51 +00:00			`class VickiFox(_ParserScraper):`
			`url = 'http://www.vickifox.com/comic/strip'`
			`stripUrl = url + '?id=%s'`
			`firstStripUrl = stripUrl % '001'`
			`imageSearch = '//img[contains(@src, "comic/")]'`
			`prevSearch = '//button[@id="btnPrev"]/@value'`

			`def getPrevUrl(self, url, data):`
			`return self.stripUrl % self.getPage(url).xpath(self.prevSearch)[0]`


Fix a bunch of comic modules. 2016-10-31 05:57:47 +00:00			`class ViiviJaWagner(_ParserScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://www.hs.fi/viivijawagner/'`
Fix ViiviJaWagner. 2017-02-12 19:29:57 +00:00			`imageSearch = '//meta[@property="og:image"]/@content'`
Replace xpath_class with custom xpath function 2020-07-31 20:56:30 +00:00			`prevSearch = '//a[d:class("prev")]'`
			`latestSearch = '//div[d:class("cartoon-content")]//a'`
Fix ViiviJaWagner. 2017-02-12 19:29:57 +00:00			`starter = indirectStarter`
Fix ViiviJaWagner. 2015-04-18 20:45:13 +00:00			`lang = 'fi'`
Fix more comics. 2012-12-07 23:45:18 +00:00
Refactor: Make namer a method. When #42 is realized, the naming of files might differ between comic modules, so the namer's logical location is the instance, not the class. 2016-04-21 06:20:49 +00:00			`def namer(self, image_url, page_url):`
Fix ViiviJaWagner. 2017-02-12 19:29:57 +00:00			`return page_url.rsplit('-', 1)[1].split('.')[0]`
Add VirmirWorld 2019-07-12 07:46:45 +00:00

			`class VirmirWorld(_ParserScraper):`
			`url = 'http://world.virmir.com/'`
			`stripUrl = url + 'comic.php?story=%s&page=%s'`
			`firstStripUrl = stripUrl % ('1', '1')`
			`imageSearch = '//div[@class="comic"]//img'`
			`prevSearch = '//a[contains(@class, "prev")]'`

			`def getIndexStripUrl(self, index):`
			`index = index.split('-')`
			`return self.stripUrl % (index[0], index[1])`
Add Vreakerz 2022-12-26 09:28:47 +00:00

			`class Vreakerz(ParserScraper):`
			`url = 'http://vreakerz.angrykitten.nl/'`
			`stripUrl = url + 'stories/read/%s'`
			`firstStripUrl = stripUrl % '1'`
			`imageSearch = '//img[contains(@src, "storypages")]'`
			`prevSearch = '//a[@class="btn-prior"]'`