dosage/dosagelib/plugins/w.py

# -*- coding: iso-8859-1 -*-
# Copyright (C) 2004-2005 Tristan Seligmann and Jonathan Jacobs
# Copyright (C) 2012-2013 Bastian Kleineidam

from re import compile, IGNORECASE

from ..scraper import _BasicScraper
from ..util import tagre


class WayfarersMoon(_BasicScraper):
    # Scraper settings for wayfarersmoon.com.
    url = 'http://www.wayfarersmoon.com/'
    # Page URL template; %s is filled with the strip index (see help).
    stripUrl = url + 'index.php?page=%s'
    # Captures the src of an <img> whose path starts with /admin.
    imageSearch = compile(r'<img src="(/admin.+?)"')
    # Captures the href of a link that is followed on the same line by the
    # back-button image.  The dot is escaped so that only the literal file
    # name "btn_back.gif" matches, not any character in that position.
    prevSearch = compile(r'<a href="(.+?)".+?btn_back\.gif')
    help = 'Index format: nn'


class WastedTalent(_BasicScraper):
    # Scraper settings for wastedtalent.ca.
    url = 'http://www.wastedtalent.ca/'
    # Page URL template; %s is filled with the strip name (see help).
    stripUrl = url + 'comic/%s'
    # Pattern for the full-size comic image URL.  tagre comes from ..util;
    # presumably it builds a regex for the given tag/attribute - confirm there.
    imageSearch = compile(tagre(
        "img", "src",
        r'(http://www\.wastedtalent\.ca/sites/default/files/imagecache'
        r'/comic_full/comics/\d+/[^"]+)',
    ))
    # Pattern for the site-relative link to the previous comic.
    prevSearch = compile(tagre(
        "a", "href",
        r'(/comic/[^"]+)',
        after="comic_prev",
    ))
    help = 'Index format: stripname'


class WhiteNinja(_BasicScraper):
    # Scraper settings for whiteninjacomics.com.
    url = "http://www.whiteninjacomics.com/comics.shtml"
    # Page URL template; %s is filled with the comic name (see help).
    stripUrl = "http://www.whiteninjacomics.com/comics/%s.shtml"
    # Captures an unquoted .gif src under /images/comics/; the negative
    # lookahead skips file names that start with "t-".
    imageSearch = compile(
        r'<img src='
        r'(/images/comics/(?!t-).+?\.gif)'
        r' border=0'
    )
    # Captures a /comics/...shtml path followed later on the same line by
    # the word "previous".
    prevSearch = compile(
        r'(/comics/.+?shtml)'
        r'.+?previous'
    )
    help = "Index format: s (comic name)"


# NOTE(review): a second ``class WhiteNoise`` is defined further down in this
# module.  Class statements bind names in order, so that later definition
# replaces this one in the module namespace.  The two differ only in
# prevSearch; decide which pattern is correct and remove the other.
class WhiteNoise(_BasicScraper):
    # Scraper settings for wncomic.com.
    url = 'http://www.wncomic.com/archive.php'
    # Page URL template; %s is filled with the strip id (see help).
    stripUrl = 'http://www.wncomic.com/archive_comments.php?strip_id=%s'
    # Captures a path starting with istrip_files/strips/ up to the next quote.
    imageSearch = compile(r'(istrip_files/strips/.+?)"')
    # Captures a quoted value starting with "archive" that appears after
    # "First " and before "top_back" on the same line.
    prevSearch = compile(r'First .+?"(archive.+?)".+?top_back')
    help = 'Index format: n'


class WhyTheLongFace(_BasicScraper):
    # Scraper settings for the "wtlf" pages on absurdnotions.org.
    url = 'http://www.absurdnotions.org/wtlf200709.html'
    # Page URL template; %s is filled with a yyyymm index (see help).
    stripUrl = 'http://www.absurdnotions.org/wtlf%s.html'
    # Captures either an absolute wtlf... image URL or a relative
    # lf<digits>.<ext> file name, case-insensitively.  Dots in the host name
    # and before the extension are escaped so they match only a literal ".".
    imageSearch = compile(r'<img src="(http://www\.absurdnotions\.org/wtlf.+?|lf\d+\.\w{1,4})"', IGNORECASE)
    multipleImagesPerStrip = True
    # Captures the href of the link wrapping the "nprev.gif" button; the dot
    # in the file name is escaped for the same reason.
    prevSearch = compile(r'HREF="(.+?)"><IMG SRC="nprev\.gif" ')
    help = 'Index format: yyyymm'


class Wigu(_BasicScraper):
    # Scraper settings for wigucomics.com.
    url = 'http://wigucomics.com/'
    # Page URL template; %s is filled with the comic number (see help).
    stripUrl = url + 'adventures/index.php?comic=%s'
    # Pattern for the site-relative comic image path.  tagre comes from
    # ..util; presumably it builds a regex for the given tag/attribute.
    imageSearch = compile(tagre(
        "img", "src",
        r'(/adventures/comics/[^"]+)',
    ))
    # Pattern for the site-relative link to the previous comic.
    prevSearch = compile(tagre(
        "a", "href",
        r'(/adventures/index\.php\?comic=\d+)',
        after="go back",
    ))
    help = 'Index format: n'


class Wonderella(_BasicScraper):
    # Scraper settings for nonadventures.com.
    url = 'http://nonadventures.com/'
    # Page URL template; %s is filled with yyyy/mm/dd/name (see help).
    stripUrl = url + '%s/'
    # Pattern for the absolute comic image URL.  tagre comes from ..util;
    # presumably it builds a regex for the given tag/attribute.
    imageSearch = compile(tagre(
        "img", "src",
        r'(http://nonadventures\.com/comics/[^"]+)',
    ))
    # Pattern for the absolute, date-based link to the previous comic.
    prevSearch = compile(tagre(
        "a", "href",
        r'(http://nonadventures\.com/\d+/\d+/\d+/[^"]+)',
        after="prev",
    ))
    help = 'Index format: yyyy/mm/dd/name'


class WotNow(_BasicScraper):
    # Scraper settings for the wotnow section of shadowburn.binmode.com.
    url = 'http://shadowburn.binmode.com/wotnow/'
    # Page URL template; %s is filled with the unpadded comic id (see help).
    stripUrl = url + 'comic.php?comic_id=%s'
    # Captures a relative image path starting with comics/.
    imageSearch = compile(r'<IMG SRC="(comics/.+?)"')
    # Captures the href of the link wrapping the "previous" button image.
    # The dot is escaped so that only the literal file name "b_prev.gif"
    # matches, not any character in that position.
    prevSearch = compile(r'<A HREF="(.+?)"><IMG SRC="images/b_prev\.gif" ')
    help = 'Index format: n (unpadded)'


# XXX disallowed by robots.txt
class _WorldOfWarcraftEh(_BasicScraper):
    # Scraper settings for woweh.com.  No strip URL template is defined
    # (stripUrl is None) and no help text is provided.
    url = 'http://woweh.com/'
    stripUrl = None
    # Captures the comics/... path of an absolute woweh.com image URL.
    # The host-name dot is escaped so it matches only a literal ".".
    imageSearch = compile(r'http://woweh\.com/(comics/.+?)"')
    # Captures the "?p=..." query of the link whose tag later contains
    # ="prev.  The original pattern used ".+:?" (greedy match followed by an
    # optional colon), which looks like a typo for the lazy ".+?"; the greedy
    # form would run the capture up to the last quote on the line that can
    # still be followed by ="prev instead of stopping at the closing quote
    # of the href.
    prevSearch = compile(r'woweh\.com/(\?p=.+?)".+?="prev')


class Wulffmorgenthaler(_BasicScraper):
    # Scraper settings for wumocomicstrip.com.
    url = 'http://wumocomicstrip.com/'
    # Page URL template; %s is filled with a yyyy/mm/dd index (see help).
    stripUrl = url + '%s/'
    # Pattern for the site-relative strip image; the character class
    # excludes "/" so the capture stays directly inside /img/strip/.
    imageSearch = compile(tagre(
        "img", "src",
        r'(/img/strip/[^/"]+)',
    ))
    # Pattern for a link tag immediately followed by "<span>Previous".
    # tagre comes from ..util; presumably it returns the regex source for
    # the tag, to which the literal suffix is appended before compiling.
    prevSearch = compile(
        tagre("a", "href", r'([^"]+)')
        + "<span>Previous"
    )
    help = 'Index format: yyyy/mm/dd'


# NOTE(review): this is the second ``class WhiteNoise`` in this module.  It is
# defined after the first one, so it is the definition that stays bound to
# the name.  The two differ only in prevSearch; the earlier copy should
# probably be removed once this pattern is confirmed.
class WhiteNoise(_BasicScraper):
    # Scraper settings for wncomic.com.
    url = 'http://www.wncomic.com/archive.php'
    # Page URL template; %s is filled with the strip id (see help).
    stripUrl = 'http://www.wncomic.com/archive_comments.php?strip_id=%s'
    # Captures a path starting with istrip_files/strips/ up to the next quote.
    imageSearch = compile(r'(istrip_files/strips/.+?)"')
    # Captures the href of the link wrapping the "top_back.jpg" image.  The
    # dot is escaped so that only the literal file name matches.
    prevSearch = compile(r'</a><a href="(.+?)"><img src="images/top_back\.jpg" ')
    help = 'Index format: n'


class WapsiSquare(_BasicScraper):
    # Scraper settings for wapsisquare.com.
    url = 'http://wapsisquare.com/'
    # Page URL template; %s is filled with the strip name (see help).
    stripUrl = url + 'comic/%s'
    # Captures the absolute comic image URL.  The host-name dot is escaped so
    # it matches only a literal ".", not any character.
    imageSearch = compile(r'<img src="(http://wapsisquare\.com/comics/.+?)"')
    # Captures the href of the link whose text is exactly "Previous".
    prevSearch = compile(r'<a href="(.+?)"[^>]+?>Previous</a>')
    help = 'Index format: strip-name'


class WeCanSleepTomorrow(_BasicScraper):
    # Scraper settings for wecansleeptomorrow.com.
    url = 'http://wecansleeptomorrow.com/'
    # Page URL template; %s is filled with yyyy/mm/dd/stripname (see help).
    stripUrl = url + '%s/'
    # Pattern for the absolute comic image URL.  tagre comes from ..util;
    # presumably it builds a regex for the given tag/attribute.
    imageSearch = compile(tagre(
        "img", "src",
        r'(http://wecansleeptomorrow\.com/comics/[^"]+)',
    ))
    # Pattern for the absolute link to the previous comic.
    prevSearch = compile(tagre(
        "a", "href",
        r'(http://wecansleeptomorrow\.com/[^"]+)',
        after="prev",
    ))
    help = 'Index format: yyyy/mm/dd/stripname'


class Wondermark(_BasicScraper):
    # Scraper settings for wondermark.com.
    url = 'http://wondermark.com/'
    # Page URL template; %s is filled with the comic number (see help).
    stripUrl = url + '%s/'
    # Captures the absolute image URL under /c/.  The host-name dot is
    # escaped so it matches only a literal ".", not any character.
    imageSearch = compile(r'<img src="(http://wondermark\.com/c/.+?)"')
    # Captures the href of the link marked rel="prev".
    prevSearch = compile(r'<a href="(.+?)" rel="prev">')
    help = 'Index format: nnn'
Updated copyright for all source files. 2012-06-20 20:41:04 +00:00			`# -- coding: iso-8859-1 --`
			`# Copyright (C) 2004-2005 Tristan Seligmann and Jonathan Jacobs`
Rename latestUrl in url 2013-02-05 18:51:46 +00:00			`# Copyright (C) 2012-2013 Bastian Kleineidam`
Fix some comics. 2012-11-21 20:57:26 +00:00
Fix some comics. 2012-11-26 06:13:32 +00:00			`from re import compile, IGNORECASE`
Initial commit to Github. 2012-06-20 19:58:13 +00:00
A lot of refactoring. 2012-10-11 10:03:12 +00:00			`from ..scraper import _BasicScraper`
Fix some comics. 2012-11-26 06:13:32 +00:00			`from ..util import tagre`
Initial commit to Github. 2012-06-20 19:58:13 +00:00

			`class WayfarersMoon(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://www.wayfarersmoon.com/'`
			`stripUrl = url + 'index.php?page=%s'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'<img src="(/admin.+?)"')`
			`prevSearch = compile(r'<a href="(.+?)".+?btn_back.gif')`
			`help = 'Index format: nn'`


Added some comics. 2013-02-06 21:08:36 +00:00			`class WastedTalent(_BasicScraper):`
			`url = 'http://www.wastedtalent.ca/'`
			`stripUrl = url + 'comic/%s'`
			`imageSearch = compile(tagre("img", "src", r'(http://www\.wastedtalent\.ca/sites/default/files/imagecache/comic_full/comics/\d+/[^"]+)'))`
			`prevSearch = compile(tagre("a", "href", r'(/comic/[^"]+)', after="comic_prev"))`
			`help = 'Index format: stripname'`


Initial commit to Github. 2012-06-20 19:58:13 +00:00			`class WhiteNinja(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://www.whiteninjacomics.com/comics.shtml'`
Rename imageUrl to stripUrl. 2012-11-13 18:10:19 +00:00			`stripUrl = 'http://www.whiteninjacomics.com/comics/%s.shtml'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'<img src=(/images/comics/(?!t-).+?\.gif) border=0')`
			`prevSearch = compile(r'(/comics/.+?shtml).+?previous')`
			`help = 'Index format: s (comic name)'`


			`class WhiteNoise(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://www.wncomic.com/archive.php'`
Rename imageUrl to stripUrl. 2012-11-13 18:10:19 +00:00			`stripUrl = 'http://www.wncomic.com/archive_comments.php?strip_id=%s'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'(istrip_files/strips/.+?)"')`
			`prevSearch = compile(r'First .+?"(archive.+?)".+?top_back')`
			`help = 'Index format: n'`


			`class WhyTheLongFace(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://www.absurdnotions.org/wtlf200709.html'`
Rename imageUrl to stripUrl. 2012-11-13 18:10:19 +00:00			`stripUrl = 'http://www.absurdnotions.org/wtlf%s.html'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'<img src="(http://www.absurdnotions.org/wtlf.+?\|lf\d+.\w{1,4})"', IGNORECASE)`
Fix comics. 2012-12-04 06:02:40 +00:00			`multipleImagesPerStrip = True`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`prevSearch = compile(r'HREF="(.+?)"><IMG SRC="nprev.gif" ')`
			`help = 'Index format: yyyymm'`


			`class Wigu(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://wigucomics.com/'`
			`stripUrl = url + 'adventures/index.php?comic=%s'`
Fix some comics. 2012-11-26 06:13:32 +00:00			`imageSearch = compile(tagre("img", "src", r'(/adventures/comics/[^"]+)'))`
			`prevSearch = compile(tagre("a", "href", r'(/adventures/index\.php\?comic=\d+)', after="go back"))`
			`help = 'Index format: n'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00

Added some comics. 2013-02-06 21:08:36 +00:00			`class Wonderella(_BasicScraper):`
			`url = 'http://nonadventures.com/'`
			`stripUrl = url + '%s/'`
			`imageSearch = compile(tagre("img", "src", r'(http://nonadventures\.com/comics/[^"]+)'))`
			`prevSearch = compile(tagre("a", "href", r'(http://nonadventures\.com/\d+/\d+/\d+/[^"]+)', after="prev"))`
			`help = 'Index format: yyyy/mm/dd/name'`


Initial commit to Github. 2012-06-20 19:58:13 +00:00			`class WotNow(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://shadowburn.binmode.com/wotnow/'`
			`stripUrl = url + 'comic.php?comic_id=%s'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'<IMG SRC="(comics/.+?)"')`
			`prevSearch = compile(r'<A HREF="(.+?)"><IMG SRC="images/b_prev.gif" ')`
			`help = 'Index format: n (unpadded)'`


Various comics are fixed. 2012-12-13 20:05:27 +00:00			`# XXX disallowed by robots.txt`
			`class _WorldOfWarcraftEh(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://woweh.com/'`
Updated documentation and fix some comics. 2012-11-20 17:53:53 +00:00			`stripUrl = None`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'http://woweh.com/(comics/.+?)"')`
			`prevSearch = compile(r'woweh.com/(\?p=.+:?)".+:?="prev')`


			`class Wulffmorgenthaler(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://wumocomicstrip.com/'`
			`stripUrl = url + '%s/'`
Fix comics. 2012-12-04 06:02:40 +00:00			`imageSearch = compile(tagre("img", "src", r'(/img/strip/[^/"]+)'))`
Fix some comics. 2012-11-26 06:13:32 +00:00			`prevSearch = compile(tagre("a", "href", r'([^"]+)') + "<span>Previous")`
			`help = 'Index format: yyyy/mm/dd'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00

			`class WhiteNoise(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://www.wncomic.com/archive.php'`
Rename imageUrl to stripUrl. 2012-11-13 18:10:19 +00:00			`stripUrl = 'http://www.wncomic.com/archive_comments.php?strip_id=%s'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'(istrip_files/strips/.+?)"')`
			`prevSearch = compile(r'</a><a href="(.+?)"><img src="images/top_back.jpg" ')`
			`help = 'Index format: n'`


			`class WapsiSquare(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://wapsisquare.com/'`
			`stripUrl = url + 'comic/%s'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'<img src="(http://wapsisquare.com/comics/.+?)"')`
			`prevSearch = compile(r'<a href="(.+?)"[^>]+?>Previous</a>')`
			`help = 'Index format: strip-name'`


			`class WeCanSleepTomorrow(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://wecansleeptomorrow.com/'`
			`stripUrl = url + '%s/'`
Fix some comics. 2012-11-26 06:13:32 +00:00			`imageSearch = compile(tagre("img", "src", r'(http://wecansleeptomorrow\.com/comics/[^"]+)'))`
			`prevSearch = compile(tagre("a", "href", r'(http://wecansleeptomorrow\.com/[^"]+)', after="prev"))`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`help = 'Index format: yyyy/mm/dd/stripname'`


			`class Wondermark(_BasicScraper):`
Always have an url attribute in comic scrapers. 2013-02-04 20:00:26 +00:00			`url = 'http://wondermark.com/'`
			`stripUrl = url + '%s/'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'<img src="(http://wondermark.com/c/.+?)"')`
			`prevSearch = compile(r'<a href="(.+?)" rel="prev">')`
			`help = 'Index format: nnn'`