dosage/dosagelib/plugins/w.py

# SPDX-License-Identifier: MIT
# SPDX-FileCopyrightText: © 2004 Tristan Seligmann and Jonathan Jacobs
# SPDX-FileCopyrightText: © 2012 Bastian Kleineidam
# SPDX-FileCopyrightText: © 2015 Tobias Gruetzmacher
# SPDX-FileCopyrightText: © 2019 Daniel Ring
from re import compile, escape, IGNORECASE

from ..scraper import ParserScraper, _BasicScraper, _ParserScraper
from ..util import tagre
from ..helpers import bounceStarter
from .common import ComicControlScraper, WordPressScraper, WordPressNaviIn, WordPressWebcomic


class WapsiSquare(WordPressNaviIn):
    """Scraper for wapsisquare.com, built on the WordPressNaviIn base class."""
    url = 'http://wapsisquare.com/'
    firstStripUrl = url + 'comic/09092001/'

    def shouldSkipUrl(self, url, data):
        """Skip pages that embed an iframe (video posts rather than comics).

        Returns whatever ``self.match`` yields for the ``//iframe`` XPath;
        the caller presumably treats a non-empty result as "skip this page".
        """
        return self.match(data, '//iframe')  # videos


class WastedTalent(_ParserScraper):
    """XPath-based scraper for www.wastedtalent.ca."""
    url = 'http://www.wastedtalent.ca/'
    # Strip pages live under comic/<name>.
    stripUrl = url + 'comic/%s'
    firstStripUrl = stripUrl % 'anime-crack'
    # Direct <img> children of the div matched by d:class("comic_content").
    imageSearch = '//div[d:class("comic_content")]/img'
    # Anchor inside the list item matched by d:class("previous").
    prevSearch = '//li[d:class("previous")]/a'
    multipleImagesPerStrip = True


class WebcomicName(_ParserScraper):
    """XPath-based scraper for webcomicname.com.

    Only the start URL is declared; no stripUrl or firstStripUrl is set here.
    """
    url = 'https://webcomicname.com/'
    # Any <img> below a <figure> matched by d:class("tmblr-full").
    imageSearch = '//figure[d:class("tmblr-full")]//img'
    # NOTE(review): the "previous" link is the anchor matched by
    # d:class("next") -- presumably the site's "next" page holds older
    # posts; confirm against the live markup.
    prevSearch = '//a[d:class("next")]'
    multipleImagesPerStrip = True


class Weregeek(ParserScraper):
    """XPath-based scraper for www.weregeek.com."""
    url = 'http://www.weregeek.com/'
    # Strip pages live under comic/<name>/ (note the trailing slash).
    stripUrl = url + 'comic/%s/'
    firstStripUrl = stripUrl % 'comic-1'
    # Any <img> below the div matched by d:class("webcomic-media").
    imageSearch = '//div[d:class("webcomic-media")]//img'
    # Anchor matched by d:class("previous-webcomic-link").
    prevSearch = '//a[d:class("previous-webcomic-link")]'


class WereIWolf(_ParserScraper):
    """XPath-based scraper for "Were I wolf" on wolfwares.ca.

    A strip page is addressed by a chapter name plus a ``start`` value, so
    strip indices have the form ``<chapter name>-<start>``.
    """
    stripUrl = 'https://wolfwares.ca/comics/Were I wolf/strip2.php?name=%s&start=%s'
    url = stripUrl % ('4 Black and White - part 3', 'latest')
    firstStripUrl = stripUrl % ('1 Sirens', '0')
    imageSearch = '//img[contains(@src, "ROW")]'
    prevSearch = '//a[./img[contains(@src, "previous")]]'
    multipleImagesPerStrip = True
    endOfLife = True
    # Chapter names in reading order; the leading character of each name
    # is its chapter number.
    chapters = ('1 Sirens',
                '2 Black and White',
                '3 Black and White - Princess and Knight',
                '4 Black and White - part 3')

    def namer(self, imageUrl, pageUrl):
        """Return the image file name prefixed with its chapter number.

        The chapter is recognised by finding one of ``self.chapters`` inside
        ``pageUrl``. If no chapter name occurs in the page URL the bare file
        name is returned instead of failing on an unbound local.
        """
        filename = imageUrl.rsplit('/', 1)[-1]
        prefix = ''
        for chapter in self.chapters:
            if chapter in pageUrl:
                # Prepend chapter number to image filename
                prefix = chapter[0] + '_'
        return prefix + filename

    def getPrevUrl(self, url, data):
        """Return the URL of the page preceding ``url``.

        The first page of a chapter (``start=0``) is linked to the
        ``latest`` page of the chapter before it; every other page is
        resolved by the parent class.
        """
        # Fix missing navigation links between chapters
        for older, newer in zip(self.chapters, self.chapters[1:]):
            if url == self.stripUrl % (newer, '0'):
                return self.stripUrl % (older, 'latest')
        return super(WereIWolf, self).getPrevUrl(url, data)

    def getIndexStripUrl(self, index):
        """Build the strip URL for an index of the form ``<chapter>-<start>``.

        Only the last hyphen separates the two parts, because chapter names
        such as "4 Black and White - part 3" contain hyphens themselves.
        Raises IndexError when ``index`` contains no hyphen at all.
        """
        parts = index.rsplit('-', 1)
        return self.stripUrl % (parts[0], parts[1])


class WhiteNoise(WordPressWebcomic):
    """Scraper for whitenoisecomic.com, built on WordPressWebcomic."""
    url = 'http://whitenoisecomic.com/'
    # Strip pages live under comic/<name>/ (note the trailing slash).
    stripUrl = url + 'comic/%s/'
    firstStripUrl = stripUrl % 'book-one'
    # Sets imageSearch explicitly: any <img> below the element with
    # id="comic".
    imageSearch = '//div[@id="comic"]//img'


class WhiteNoiseLee(ComicControlScraper):
    """Scraper for www.white-noise-comic.com, built on ComicControlScraper."""
    url = 'http://www.white-noise-comic.com/'
    stripUrl = url + 'comic/%s'
    firstStripUrl = stripUrl % '1-0'
    starter = bounceStarter

    def namer(self, imageUrl, pageUrl):
        """Name the image after the last path segment of the page URL.

        The extension is whatever follows the final dot of ``imageUrl``.
        """
        pageSlug = pageUrl.rpartition('/')[2]
        extension = imageUrl.rpartition('.')[2]
        return '%s.%s' % (pageSlug, extension)


class Whomp(ComicControlScraper):
    """Scraper for www.whompcomic.com, built on ComicControlScraper."""
    url = 'http://www.whompcomic.com/'
    firstStripUrl = url + 'comic/06152010'
    # Selects the title attribute of the image with id="cc-comic".
    textSearch = '//img[@id="cc-comic"]/@title'


class WhyTheLongFace(_BasicScraper):
    """Regex-based scraper for the "wtlf" pages on www.absurdnotions.org."""
    baseUrl = 'http://www.absurdnotions.org/'
    # Regex-escaped base URL, embedded in imageSearch below.
    rurl = escape(baseUrl)
    url = baseUrl + 'wtlf200709.html'
    stripUrl = baseUrl + 'wtlf%s.html'
    firstStripUrl = stripUrl % '200306'
    # Captures either an absolute image URL beginning with "<baseUrl>wtlf"
    # or a relative name "lf<digits><any char><1-4 word chars>"; matching is
    # case-insensitive.
    # NOTE(review): the "." after the digits is unescaped, so it matches any
    # character rather than only the extension dot -- probably meant "\.".
    imageSearch = compile(r'<img src="(%swtlf.+?|lf\d+.\w{1,4})"' % rurl,
                          IGNORECASE)
    multipleImagesPerStrip = True
    # Captures the href of the link that wraps the "nprev.gif" image; unlike
    # imageSearch this pattern is case-sensitive.
    prevSearch = compile(r'HREF="(.+?)"><IMG SRC="nprev.gif" ')
    help = 'Index format: yyyymm'


class Widdershins(ComicControlScraper):
    """Scraper for widdershinscomic.com, built on ComicControlScraper."""
    url = 'https://widdershinscomic.com/'
    stripUrl = url + 'wdshn/%s'
    firstStripUrl = stripUrl % 'sleight-of-hand-cover'
    starter = bounceStarter

    def namer(self, imageUrl, pageUrl):
        """Combine the page URL's last path segment with the image extension."""
        _, _, pageName = pageUrl.rpartition('/')
        _, _, suffix = imageUrl.rpartition('.')
        return '.'.join((pageName, suffix))


class Wigu(_ParserScraper):
    """XPath-based scraper for www.wigucomics.com (flagged endOfLife)."""
    stripUrl = 'http://www.wigucomics.com/adventures/index.php?comic=%s'
    # The start page is requested with comic=-1.
    url = stripUrl % '-1'
    firstStripUrl = stripUrl % '1'
    # Images below the element with id="comic" whose src contains "/comics/".
    imageSearch = '//div[@id="comic"]//img[contains(@src, "/comics/")]'
    # The back link is identified by its alt text.
    prevSearch = '//a[@alt="go back"]'
    endOfLife = True
    help = 'Index format: n'


class WildeLife(ComicControlScraper):
    """Scraper for www.wildelifecomic.com, built on ComicControlScraper."""
    url = 'http://www.wildelifecomic.com/'
    # Strip pages live under comic/<index>; the first strip has index 1.
    stripUrl = url + 'comic/%s'
    firstStripUrl = stripUrl % '1'


class Wolfpac(WordPressScraper):
    """Scraper for wolfpac.ca, built on WordPressScraper."""
    url = 'https://wolfpac.ca/'
    firstStripUrl = url + 'archives/comic/wolfpac-title'


class Wonderella(_BasicScraper):
    """Regex-based scraper for nonadventures.com."""
    url = 'http://nonadventures.com/'
    # Regex-escaped site URL, embedded in the search patterns below.
    rurl = escape(url)
    stripUrl = url + '%s/'
    firstStripUrl = stripUrl % '2006/09/09/the-torment-of-a-thousand-yesterdays'
    # A div tag with id "comic", optional whitespace, then an img tag whose
    # src is captured and must start with "<url>comics/". The tag patterns
    # come from the project helper tagre.
    imageSearch = compile(tagre("div", "id", r"comic", quote=r'["\']') +
                          r"\s*" +
                          tagre("img", "src", r'(%scomics/[^"]+)' % rurl))
    # An anchor whose href is a dated strip URL (<url>n/n/n/name); the
    # after="prev" argument presumably requires "prev" later in the tag --
    # TODO confirm against tagre.
    prevSearch = compile(tagre("a", "href", r'(%s\d+/\d+/\d+/[^"]+)' % rurl,
                               after="prev"))
    help = 'Index format: yyyy/mm/dd/name'


class Wondermark(WordPressScraper):
    """Scraper for wondermark.com, built on WordPressScraper."""
    url = 'http://wondermark.com/'
    stripUrl = url + '%s/'
    firstStripUrl = stripUrl % '001'
    # Sets prevSearch explicitly: the anchor marked rel="prev".
    prevSearch = '//a[@rel="prev"]'
    # The index scheme changes with the strip number, as spelled out here.
    help = 'Index format: nnn (001-999), 1knn (1000-1099), cnnnn (1100-)'


class WorldOfMrToast(_BasicScraper):
    """Regex-based scraper for the Mr. Toast pages on theimaginaryworld.com.

    The site has no prev/next navigation, so the archive pages are listed
    explicitly in ``prevurls`` and walked in that order.
    """
    baseUrl = 'http://www.theimaginaryworld.com/'
    url = baseUrl + 'mrTcomicA.html'
    imageSearch = compile(tagre("img", "src", r'(comic[^"]+)'))
    # list the archive links since there is no prev/next navigation
    prevurls = (
        url,
        baseUrl + 'mrTcomicW02.html',
        baseUrl + 'mrTcomicW01.html',
        baseUrl + 'mrGcomic03.html',
        baseUrl + 'mrGcomic02.html',
        baseUrl + 'mrGcomic01.html',
        baseUrl + 'mrTcomicT05.html',
        baseUrl + 'mrTcomicT04.html',
        baseUrl + 'mrTcomicT03.html',
        baseUrl + 'mrTcomicT02.html',
        baseUrl + 'mrTcomicT01.html',
        baseUrl + 'mrTcomicIW3.html',
        baseUrl + 'mrTcomicIW2.html',
        baseUrl + 'mrTcomicIW1.html',
    )
    firstStripUrl = prevurls[-1]
    multipleImagesPerStrip = True
    endOfLife = True

    def getPrevUrl(self, url, data):
        """Return the entry following ``url`` in ``prevurls``, or None.

        None is returned both for the last listed page (IndexError) and for
        a URL that is not in the list at all (ValueError from ``index``),
        so an unexpected URL ends the walk instead of raising.
        """
        try:
            return self.prevurls[self.prevurls.index(url) + 1]
        except (ValueError, IndexError):
            return None


class WormWorldSaga(_BasicScraper):
    """Regex-based scraper for www.wormworldsaga.com.

    Each chapter is a single page at ``chapters/chapterNN/<LANG>/index.php``;
    the walk starts at ``latestChapter`` and steps down one chapter at a time.
    """
    url = 'http://www.wormworldsaga.com/'
    stripUrl = url + 'chapters/%s/index.php'
    firstStripUrl = stripUrl % 'chapter01/EN'
    # Two image locations are searched: images/CH<n>_<n>.* and panels/CH<n>_*.
    imageSearch = (
        compile(tagre("img", "src", r'(images/CH\d+_\d+\.[^"]+)')),
        compile(tagre("img", "src", r'(panels/CH\d+_[^"]+)')),
    )
    latestChapter = 5
    multipleImagesPerStrip = True
    # Extracts the chapter number from a chapter URL ("chapters/" itself has
    # no digits after "chapter" and is therefore not matched).
    chapterSearch = compile(r'chapter(\d+)')

    def starter(self):
        """Return the URL of the latest chapter in this scraper's language."""
        return '%schapters/chapter%02d/%s/index.php' % (
            self.url, self.latestChapter, self.lang.upper())

    def getPrevUrl(self, url, data):
        """Return the URL of the chapter before the one in ``url``.

        The previous chapter is derived numerically so the walk works from
        any ``latestChapter`` value. Returns None for chapter 1 and for URLs
        without a chapter number.
        """
        found = self.chapterSearch.search(url)
        if found is None:
            return None
        chapter = int(found.group(1))
        if chapter <= 1:
            return None
        return url.replace(found.group(0), 'chapter%02d' % (chapter - 1))


class WormWorldSagaFrench(WormWorldSaga):
    # Language code; WormWorldSaga.starter upper-cases it into the chapter URL.
    lang = 'fr'


class WormWorldSagaGerman(WormWorldSaga):
    # Language code; WormWorldSaga.starter upper-cases it into the chapter URL.
    lang = 'de'


class WormWorldSagaSpanish(WormWorldSaga):
    # Language code; WormWorldSaga.starter upper-cases it into the chapter URL.
    lang = 'es'
Update file headers The default encoding for source files is UTF-8 since Python 3, so we can drop all encoding headers. While we are at it, just replace them with SPDX headers. 2020-04-18 11:45:44 +00:00			`# SPDX-License-Identifier: MIT`
Unify XPath NS config over modules 2024-03-17 20:44:46 +00:00			`# SPDX-FileCopyrightText: © 2004 Tristan Seligmann and Jonathan Jacobs`
			`# SPDX-FileCopyrightText: © 2012 Bastian Kleineidam`
			`# SPDX-FileCopyrightText: © 2015 Tobias Gruetzmacher`
			`# SPDX-FileCopyrightText: © 2019 Daniel Ring`
Use re.escape and add some firstStripUrl. 2013-04-10 16:19:11 +00:00			`from re import compile, escape, IGNORECASE`
Initial commit to Github. 2012-06-20 19:58:13 +00:00
Fix Weregeek 2023-06-07 04:03:36 +00:00			`from ..scraper import ParserScraper, _BasicScraper, _ParserScraper`
Fix some comics. 2012-11-26 06:13:32 +00:00			`from ..util import tagre`
Remove WebDesignerCOTW 2020-09-30 19:13:11 +00:00			`from ..helpers import bounceStarter`
Add Wolfpac 2022-06-06 13:00:56 +00:00			`from .common import ComicControlScraper, WordPressScraper, WordPressNaviIn, WordPressWebcomic`
Initial commit to Github. 2012-06-20 19:58:13 +00:00

Deprecate underscore-prefixed parent classes This is trying to strike a balance between updating as much existing classes as possible, but not making the diff too big... 2022-06-06 10:08:32 +00:00			`class WapsiSquare(WordPressNaviIn):`
Sort comics. 2013-03-06 19:21:10 +00:00			`url = 'http://wapsisquare.com/'`
Fix some more comic modules. 2016-05-16 21:16:29 +00:00			`firstStripUrl = url + 'comic/09092001/'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00
Skip videos for WapsiSquare 2020-09-30 19:17:46 +00:00			`def shouldSkipUrl(self, url, data):`
			`"""Skip pages without images."""`
Unify XPath NS config over modules 2024-03-17 20:44:46 +00:00			`return self.match(data, '//iframe') # videos`
Skip videos for WapsiSquare 2020-09-30 19:17:46 +00:00
Initial commit to Github. 2012-06-20 19:58:13 +00:00
Switch WastedTalent to ParserScraper 2020-09-30 19:24:01 +00:00			`class WastedTalent(_ParserScraper):`
Added some comics. 2013-02-06 21:08:36 +00:00			`url = 'http://www.wastedtalent.ca/'`
			`stripUrl = url + 'comic/%s'`
Add firstStripUrls. 2013-04-10 21:57:09 +00:00			`firstStripUrl = stripUrl % 'anime-crack'`
Switch WastedTalent to ParserScraper 2020-09-30 19:24:01 +00:00			`imageSearch = '//div[d:class("comic_content")]/img'`
			`prevSearch = '//li[d:class("previous")]/a'`
			`multipleImagesPerStrip = True`
Added some comics. 2013-02-06 21:08:36 +00:00

Add WebcomicName 2020-04-19 21:42:27 +00:00			`class WebcomicName(_ParserScraper):`
			`url = 'https://webcomicname.com/'`
Replace xpath_class with custom xpath function 2020-07-31 20:56:30 +00:00			`imageSearch = '//figure[d:class("tmblr-full")]//img'`
			`prevSearch = '//a[d:class("next")]'`
Add WebcomicName 2020-04-19 21:42:27 +00:00			`multipleImagesPerStrip = True`


Fix Weregeek 2023-06-07 04:03:36 +00:00			`class Weregeek(ParserScraper):`
Added EdmundFinney, Gaia, GaiaGerman, InternetWebcomic, NotInventedHere, RedsPlanet, RomanticallyApocalyptic, ScandinaviaAndTheWorld, TheGamerCat, Weregeek 2013-12-10 18:50:21 +00:00			`url = 'http://www.weregeek.com/'`
Fix Weregeek 2023-06-07 04:03:36 +00:00			`stripUrl = url + 'comic/%s/'`
			`firstStripUrl = stripUrl % 'comic-1'`
			`imageSearch = '//div[d:class("webcomic-media")]//img'`
			`prevSearch = '//a[d:class("previous-webcomic-link")]'`
Added EdmundFinney, Gaia, GaiaGerman, InternetWebcomic, NotInventedHere, RedsPlanet, RomanticallyApocalyptic, ScandinaviaAndTheWorld, TheGamerCat, Weregeek 2013-12-10 18:50:21 +00:00

Add WereIWolf 2019-07-13 07:49:31 +00:00			`class WereIWolf(_ParserScraper):`
			`stripUrl = 'https://wolfwares.ca/comics/Were I wolf/strip2.php?name=%s&start=%s'`
			`url = stripUrl % ('4 Black and White - part 3', 'latest')`
			`firstStripUrl = stripUrl % ('1 Sirens', '0')`
			`imageSearch = '//img[contains(@src, "ROW")]'`
			`prevSearch = '//a[./img[contains(@src, "previous")]]'`
			`multipleImagesPerStrip = True`
			`endOfLife = True`
			`chapters = ('1 Sirens',`
			`'2 Black and White',`
			`'3 Black and White - Princess and Knight',`
			`'4 Black and White - part 3')`

			`def namer(self, imageUrl, pageUrl):`
			`# Prepend chapter number to image filename`
			`for chapter in self.chapters:`
			`if chapter in pageUrl:`
			`chapterNum = chapter[0]`
			`return chapterNum + '_' + imageUrl.rsplit('/', 1)[-1]`

			`def getPrevUrl(self, url, data):`
			`# Fix missing navigation links between chapters`
			`if url == self.stripUrl % (self.chapters[3], '0'):`
			`return self.stripUrl % (self.chapters[2], 'latest')`
			`if url == self.stripUrl % (self.chapters[2], '0'):`
			`return self.stripUrl % (self.chapters[1], 'latest')`
			`if url == self.stripUrl % (self.chapters[1], '0'):`
			`return self.stripUrl % (self.chapters[0], 'latest')`
			`return super(WereIWolf, self).getPrevUrl(url, data)`

			`def getIndexStripUrl(self, index):`
			`# Get comic strip URL from index`
			`index = index.split('-')`
			`return self.stripUrl % (index[0], index[1])`


Deprecate underscore-prefixed parent classes This is trying to strike a balance between updating as much existing classes as possible, but not making the diff too big... 2022-06-06 10:08:32 +00:00			`class WhiteNoise(WordPressWebcomic):`
Fix some more comic modules. 2016-05-16 21:16:29 +00:00			`url = 'http://whitenoisecomic.com/'`
Fix WhiteNoise 2019-10-19 22:27:43 +00:00			`stripUrl = url + 'comic/%s/'`
			`firstStripUrl = stripUrl % 'book-one'`
Add common handler for mgsisk's Wordpress Webcomic plugin 2019-10-18 07:49:55 +00:00			`imageSearch = '//div[@id="comic"]//img'`
Sort entries. 2013-04-10 16:36:33 +00:00

Deprecate underscore-prefixed parent classes This is trying to strike a balance between updating as much existing classes as possible, but not making the diff too big... 2022-06-06 10:08:32 +00:00			`class WhiteNoiseLee(ComicControlScraper):`
Add WhiteNoiseLee 2019-06-21 07:54:45 +00:00			`url = 'http://www.white-noise-comic.com/'`
			`stripUrl = url + 'comic/%s'`
			`firstStripUrl = stripUrl % '1-0'`
			`starter = bounceStarter`

			`def namer(self, imageUrl, pageUrl):`
			`return pageUrl.rsplit('/', 1)[-1] + '.' + imageUrl.rsplit('.', 1)[-1]`


Deprecate underscore-prefixed parent classes This is trying to strike a balance between updating as much existing classes as possible, but not making the diff too big... 2022-06-06 10:08:32 +00:00			`class Whomp(ComicControlScraper):`
Added Whomp. 2014-06-24 18:48:49 +00:00			`url = 'http://www.whompcomic.com/'`
Move more comics to common WordPressScraper. 2016-04-10 21:04:34 +00:00			`firstStripUrl = url + 'comic/06152010'`
			`textSearch = '//img[@id="cc-comic"]/@title'`
Added Whomp. 2014-06-24 18:48:49 +00:00

Initial commit to Github. 2012-06-20 19:58:13 +00:00			`class WhyTheLongFace(_BasicScraper):`
s/baseurl/baseUrl/g 2013-04-13 18:58:00 +00:00			`baseUrl = 'http://www.absurdnotions.org/'`
			`rurl = escape(baseUrl)`
			`url = baseUrl + 'wtlf200709.html'`
			`stripUrl = baseUrl + 'wtlf%s.html'`
Add firstStripUrls. 2013-04-10 21:57:09 +00:00			`firstStripUrl = stripUrl % '200306'`
Sort comics alphabetically & PEP8 style fixes. 2016-03-31 21:13:54 +00:00			`imageSearch = compile(r'<img src="(%swtlf.+?\|lf\d+.\w{1,4})"' % rurl,`
			`IGNORECASE)`
Fix comics. 2012-12-04 06:02:40 +00:00			`multipleImagesPerStrip = True`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`prevSearch = compile(r'HREF="(.+?)"><IMG SRC="nprev.gif" ')`
			`help = 'Index format: yyyymm'`


Remove old location for Widdershins 2022-06-06 14:48:39 +00:00			`class Widdershins(ComicControlScraper):`
Support Widdershins as it no longer updates GoComics (#225) [Widdershins stopped updating on GoComics in December 2020](https://www.gocomics.com/widdershins/2020/12/08). However, the comic has been [regularly updated since](https://www.widdershinscomic.com/wdshn/may-20th-2022) on the main comic site. This commit adds a plugin for the main site. I've verified that it can scrape all comics, including recent ones not on GoComics. 2022-06-06 14:46:14 +00:00			`url = 'https://widdershinscomic.com/'`
			`stripUrl = url + 'wdshn/%s'`
			`firstStripUrl = stripUrl % 'sleight-of-hand-cover'`
			`starter = bounceStarter`

			`def namer(self, imageUrl, pageUrl):`
			`return pageUrl.rsplit('/', 1)[-1] + '.' + imageUrl.rsplit('.', 1)[-1]`


Fix some more comic modules. 2016-05-16 21:16:29 +00:00			`class Wigu(_ParserScraper):`
			`stripUrl = 'http://www.wigucomics.com/adventures/index.php?comic=%s'`
			`url = stripUrl % '-1'`
Add firstStripUrls. 2013-04-10 21:57:09 +00:00			`firstStripUrl = stripUrl % '1'`
Fix some more comic modules. 2016-05-16 21:16:29 +00:00			`imageSearch = '//div[@id="comic"]//img[contains(@src, "/comics/")]'`
			`prevSearch = '//a[@alt="go back"]'`
			`endOfLife = True`
Fix some comics. 2012-11-26 06:13:32 +00:00			`help = 'Index format: n'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00

Deprecate underscore-prefixed parent classes This is trying to strike a balance between updating as much existing classes as possible, but not making the diff too big... 2022-06-06 10:08:32 +00:00			`class WildeLife(ComicControlScraper):`
Add WildeLife 2019-07-02 07:23:52 +00:00			`url = 'http://www.wildelifecomic.com/'`
			`stripUrl = url + 'comic/%s'`
			`firstStripUrl = stripUrl % '1'`


Add Wolfpac 2022-06-06 13:00:56 +00:00			`class Wolfpac(WordPressScraper):`
			`url = 'https://wolfpac.ca/'`
			`firstStripUrl = url + 'archives/comic/wolfpac-title'`


Added some comics. 2013-02-06 21:08:36 +00:00			`class Wonderella(_BasicScraper):`
			`url = 'http://nonadventures.com/'`
Use re.escape and add some firstStripUrl. 2013-04-10 16:19:11 +00:00			`rurl = escape(url)`
Added some comics. 2013-02-06 21:08:36 +00:00			`stripUrl = url + '%s/'`
Add firstStripUrls. 2013-04-10 21:57:09 +00:00			`firstStripUrl = stripUrl % '2006/09/09/the-torment-of-a-thousand-yesterdays'`
Sort comics alphabetically & PEP8 style fixes. 2016-03-31 21:13:54 +00:00			`imageSearch = compile(tagre("div", "id", r"comic", quote=r'["\']') +`
			`r"\s*" +`
			`tagre("img", "src", r'(%scomics/[^"]+)' % rurl))`
			`prevSearch = compile(tagre("a", "href", r'(%s\d+/\d+/\d+/[^"]+)' % rurl,`
			`after="prev"))`
Added some comics. 2013-02-06 21:08:36 +00:00			`help = 'Index format: yyyy/mm/dd/name'`


Fix Wondermark 2022-06-06 14:22:31 +00:00			`class Wondermark(WordPressScraper):`
Sort entries. 2013-04-10 16:36:33 +00:00			`url = 'http://wondermark.com/'`
			`stripUrl = url + '%s/'`
Add firstStripUrls. 2013-04-10 21:57:09 +00:00			`firstStripUrl = stripUrl % '001'`
Fix Wondermark 2022-06-06 14:22:31 +00:00			`prevSearch = '//a[@rel="prev"]'`
			`help = 'Index format: nnn (001-999), 1knn (1000-1099), cnnnn (1100-)'`
Sort entries. 2013-04-10 16:36:33 +00:00

Added some comic strips and cleanup the scraper code. 2013-03-06 19:00:30 +00:00			`class WorldOfMrToast(_BasicScraper):`
s/baseurl/baseUrl/g 2013-04-13 18:58:00 +00:00			`baseUrl = 'http://www.theimaginaryworld.com/'`
			`url = baseUrl + 'mrTcomicA.html'`
Added some comic strips and cleanup the scraper code. 2013-03-06 19:00:30 +00:00			`imageSearch = compile(tagre("img", "src", r'(comic[^"]+)'))`
			`# list the archive links since there is no prev/next navigation`
			`prevurls = (`
			`url,`
s/baseurl/baseUrl/g 2013-04-13 18:58:00 +00:00			`baseUrl + 'mrTcomicW02.html',`
			`baseUrl + 'mrTcomicW01.html',`
			`baseUrl + 'mrGcomic03.html',`
			`baseUrl + 'mrGcomic02.html',`
			`baseUrl + 'mrGcomic01.html',`
			`baseUrl + 'mrTcomicT05.html',`
			`baseUrl + 'mrTcomicT04.html',`
			`baseUrl + 'mrTcomicT03.html',`
			`baseUrl + 'mrTcomicT02.html',`
			`baseUrl + 'mrTcomicT01.html',`
			`baseUrl + 'mrTcomicIW3.html',`
			`baseUrl + 'mrTcomicIW2.html',`
			`baseUrl + 'mrTcomicIW1.html',`
Added some comic strips and cleanup the scraper code. 2013-03-06 19:00:30 +00:00			`)`
			`firstStripUrl = prevurls[-1]`
			`multipleImagesPerStrip = True`
Fix some more comic modules. 2016-05-16 21:16:29 +00:00			`endOfLife = True`
Added some comic strips and cleanup the scraper code. 2013-03-06 19:00:30 +00:00
Fix some more comic modules. 2016-05-16 21:16:29 +00:00			`def getPrevUrl(self, url, data):`
Added some comic strips and cleanup the scraper code. 2013-03-06 19:00:30 +00:00			`idx = self.prevurls.index(url)`
			`try:`
Move more comics to common WordPressScraper. 2016-04-10 21:04:34 +00:00			`return self.prevurls[idx + 1]`
Added some comic strips and cleanup the scraper code. 2013-03-06 19:00:30 +00:00			`except IndexError:`
			`return None`


Added some comics, fixed some. 2013-03-21 17:33:16 +00:00			`class WormWorldSaga(_BasicScraper):`
			`url = 'http://www.wormworldsaga.com/'`
			`stripUrl = url + 'chapters/%s/index.php'`
			`firstStripUrl = stripUrl % 'chapter01/EN'`
			`imageSearch = (`
			`compile(tagre("img", "src", r'(images/CH\d+_\d+\.[^"]+)')),`
			`compile(tagre("img", "src", r'(panels/CH\d+_[^"]+)')),`
			`)`
Updated wormworld chapter. 2013-04-30 04:42:49 +00:00			`latestChapter = 5`
Added some comics, fixed some. 2013-03-21 17:33:16 +00:00			`multipleImagesPerStrip = True`

Refactor: Convert starter to simple method. 2016-04-13 18:01:51 +00:00			`def starter(self):`
Added some comics, fixed some. 2013-03-21 17:33:16 +00:00			`return '%schapters/chapter%02d/%s/index.php' % (`
Refactor: Convert starter to simple method. 2016-04-13 18:01:51 +00:00			`self.url, self.latestChapter, self.lang.upper())`
Added some comics, fixed some. 2013-03-21 17:33:16 +00:00
fixed WormWorldSaga 2015-05-31 23:45:22 +00:00			`def getPrevUrl(self, url, data):`
Added some comics, fixed some. 2013-03-21 17:33:16 +00:00			`"""Find previous URL."""`
			`if 'chapter04' in url:`
			`return url.replace('chapter04', 'chapter03')`
			`if 'chapter03' in url:`
			`return url.replace('chapter03', 'chapter02')`
			`if 'chapter02' in url:`
			`return url.replace('chapter02', 'chapter01')`
			`return None`


Sort comics alphabetically & PEP8 style fixes. 2016-03-31 21:13:54 +00:00			`class WormWorldSagaFrench(WormWorldSaga):`
			`lang = 'fr'`


Added some comics, fixed some. 2013-03-21 17:33:16 +00:00			`class WormWorldSagaGerman(WormWorldSaga):`
			`lang = 'de'`

Sort comics alphabetically & PEP8 style fixes. 2016-03-31 21:13:54 +00:00
Added some comics, fixed some. 2013-03-21 17:33:16 +00:00			`class WormWorldSagaSpanish(WormWorldSaga):`
			`lang = 'es'`