2012-06-20 20:41:04 +00:00
|
|
|
# -*- coding: iso-8859-1 -*-
|
|
|
|
# Copyright (C) 2004-2005 Tristan Seligmann and Jonathan Jacobs
|
2012-06-20 19:58:13 +00:00
|
|
|
from re import compile, IGNORECASE
|
|
|
|
|
2012-10-11 10:03:12 +00:00
|
|
|
from ..scraper import _BasicScraper
|
|
|
|
from ..helpers import indirectStarter
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
|
|
|
|
class TalesOfPylea(_BasicScraper):
    """Scraper settings for the comic served from http://talesofpylea.com/."""

    # Site root; also the prefix of every strip URL below.
    latestUrl = 'http://talesofpylea.com/'
    # Strip URL template: the '%s' placeholder takes the strip index.
    stripUrl = latestUrl + '%s/'

    # Hint describing what an index looks like.
    help = 'Index format: nnn'

    # Captures the href of the "Back" link (note the leading space).
    prevSearch = compile(r' <a href="(.+?)">Back</a>')
    # Captures the relative image path below istrip_files/strips/.
    imageSearch = compile(r'<img src="(istrip_files/strips/.+?)"')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class TheNoob(_BasicScraper):
    """Scraper settings for the comic at http://www.thenoobcomic.com/."""

    # Index page of the site; strip URLs are this page plus a query string.
    latestUrl = 'http://www.thenoobcomic.com/index.php'
    # Strip URL template. The placeholder must be a complete '%s': a bare
    # trailing '%' makes "stripUrl % index" raise
    # "ValueError: incomplete format".
    stripUrl = latestUrl + '?pos=%s'
    # Captures the image path below /headquarters/comics/.
    imageSearch = compile(r'<img src="(/headquarters/comics/.+?)"')
    # Captures the href of the "previous" navigation button.
    prevSearch = compile(r'<a class="comic_nav_previous_button" href="(.+?)"></a>')
    # Hint describing what an index looks like.
    help = 'Index format: nnnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class TheOrderOfTheStick(_BasicScraper):
    """Scraper settings for The Order of the Stick at http://www.giantitp.com/."""

    # Site root; the starter below looks here for a link to a strip page.
    latestUrl = 'http://www.giantitp.com/'
    # Strip *page* URL template. Strip pages are /comics/oots<NNNN>.html, as
    # the prevSearch and starter patterns show; /comics/images/ only holds
    # the image files that imageSearch extracts from those pages.
    stripUrl = latestUrl + 'comics/oots%s.html'
    # Captures the image path below /comics/images/.
    imageSearch = compile(r'<IMG src="(/comics/images/.+?)">')
    # Captures the strip page linked from the "Back" navigation image.
    prevSearch = compile(
        r'<A href="(/comics/oots\d{4}\.html)">'
        r'<IMG src="/Images/redesign/ComicNav_Back.gif"'
    )
    # NOTE(review): the page patterns above expect four digits, while this
    # hint says "unpadded" -- confirm which form the index must take.
    help = 'Index format: n (unpadded)'
    # Finds the starting strip page by matching a link on the site root.
    starter = indirectStarter(latestUrl, compile(r'<A href="(/comics/oots\d{4}\.html)"'))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class TheParkingLotIsFull(_BasicScraper):
    """Scraper settings for the archive at plif.courageunfettered.com."""

    # Archive page for 2002, used as the entry point.
    latestUrl = 'http://plif.courageunfettered.com/archive/arch2002.htm'
    # URL template with a '%s' placeholder for the index.
    stripUrl = 'http://plif.courageunfettered.com/archive/wc%s.gif'

    # Hint describing what an index looks like.
    help = 'Index format: nnn'

    # Captures the link to another year's archive page (arch<YYYY>.htm) that
    # follows a '-' separator and a line break.
    prevSearch = compile(r'-\s*\n\s*<A HREF="(arch\d{4}\.htm)">\d{4}</A>')
    # Captures the wc<digits>.<ext> link target inside a centred table cell.
    imageSearch = compile(
        r'<td align="center">'
        r'<A TARGET=_parent HREF="(wc\d+\..+?)">'
    )
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class TheWotch(_BasicScraper):
    """Scraper settings for the comic at http://www.thewotch.com/."""

    # Site root; strip URLs append an epDate query to it.
    latestUrl = 'http://www.thewotch.com/'
    # Strip URL template: the '%s' placeholder takes the episode date.
    stripUrl = latestUrl + '?epDate=%s'

    # Hint describing what an index looks like.
    help = 'Index format: yyyy-mm-dd'

    # Captures the ?epDate=... href of the <link rel='Previous'> element.
    prevSearch = compile(r"<link rel='Previous' href='(\?epDate=\d+-\d+-\d+)'")
    # Captures the single-quoted image path starting with comics/.
    imageSearch = compile(r"<img.+?src='(comics/.+?)'")
|
|
|
|
|
|
|
|
|
|
|
|
class Thorn(_BasicScraper):
    """Scraper settings for the comic under http://www.mimisgrotto.com/thorn/."""

    # Index page of the comic.
    latestUrl = 'http://www.mimisgrotto.com/thorn/index.html'
    # Strip page URL template with a '%s' placeholder for the index.
    stripUrl = 'http://www.mimisgrotto.com/thorn/%s.html'

    # Hint describing what an index looks like.
    help = 'Index format: nnn'

    # Captures a page name made of three digits, one arbitrary character
    # (the '.' is not escaped) and "html", directly before '">Prev'.
    prevSearch = compile(r'(\d[\d][\d].html)">Prev')
    # Captures any double-quoted value that starts with strips/.
    imageSearch = compile(r'"(strips/.+?)"')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class TwoTwoOneFour(_BasicScraper):
    """Scraper settings for http://www.nitrocosm.com/go/2214_classic/."""

    # Base URL of the comic; strip URLs are built on top of it.
    latestUrl = 'http://www.nitrocosm.com/go/2214_classic/'
    # Strip URL template: the '%s' placeholder takes the strip index.
    stripUrl = latestUrl + '%s/'

    # Hint describing what an index looks like.
    help = 'Index format: n (unpadded)'

    # Captures the href of the anchor wrapping the "previous" button.
    prevSearch = compile(
        r'<a href="([^"]+)"[^>]*>'
        r'<button type="submit" class="nav_btn_previous">'
    )
    # Captures the src of the <img class="gallery_display"> element.
    imageSearch = compile(r'<img class="gallery_display" src="([^"]+)"')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class TheWhiteboard(_BasicScraper):
    """Scraper settings for the comic at http://www.the-whiteboard.com/."""

    # Site root; strip pages are named auto<index>.html below it.
    latestUrl = 'http://www.the-whiteboard.com/'
    # Strip page URL template with a '%s' placeholder for the index.
    stripUrl = latestUrl + 'auto%s.html'
    # Captures an image name starting with autotwb or autowb followed by one
    # to four digits; matched case-insensitively.
    imageSearch = compile(r'<img SRC="(autotwb\d{1,4}.+?|autowb\d{1,4}.+?)">', IGNORECASE)
    # Captures the href of the "previous" link (note the leading space);
    # matched case-insensitively.
    prevSearch = compile(r' <a href="(.+?)">previous</a>', IGNORECASE)
    # Hint describing what an index looks like ("wg." was a typo for "e.g.").
    help = 'Index format: twb or wb + n e.g. twb1000'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class _TheFallenAngel(_BasicScraper):
    """Shared settings for comics hosted on www.thefallenangel.co.uk.

    All URLs are derived from ``self.shortName``, which this class does not
    define itself; concrete subclasses are expected to provide it.
    """

    # Hint describing what an index looks like.
    help = 'Index format: yyyymmdd'

    # Captures the href of the link wrapping the previousday.jpg image
    # (note the leading space).
    prevSearch = compile(
        r' <a href="(http://www.thefallenangel.co.uk/.+?)">'
        r'<img[^>]+?src="http://www.thefallenangel.co.uk/images/previousday.jpg"'
    )
    # Captures the absolute image URL inside a "<word>comics/" directory.
    imageSearch = compile(r'SRC="(http://www.thefallenangel.co.uk/\w+comics/.+?)"')

    @property
    def baseUrl(self):
        """Return the CGI script URL built from ``self.shortName``."""
        template = 'http://www.thefallenangel.co.uk/cgi-bin/%sautokeen/autokeenlite.cgi'
        return template % (self.shortName,)

    @property
    def stripUrl(self):
        """Return the strip URL template: ``baseUrl`` plus a date query."""
        base = self.baseUrl
        return base + '?date=%s'

    def starter(self):
        """Return the URL to start from, which is simply ``baseUrl``."""
        start = self.baseUrl
        return start
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class HighMaintenance(_TheFallenAngel):
    """The "High Maintenance" comic, configured on top of _TheFallenAngel."""

    # Fragment that the inherited baseUrl property inserts into the CGI path.
    shortName = 'hm'
    # Full scraper name, grouped under the TheFallenAngel/ prefix.
    name = 'TheFallenAngel/HighMaintenance'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class FAWK(_TheFallenAngel):
    """The "FAWK" comic, configured on top of _TheFallenAngel."""

    # Fragment that the inherited baseUrl property inserts into the CGI path.
    shortName = 'fawk'
    # Full scraper name, grouped under the TheFallenAngel/ prefix.
    name = 'TheFallenAngel/FAWK'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class MalloryChan(_TheFallenAngel):
    """The "Mallory Chan" comic, configured on top of _TheFallenAngel."""

    # Fragment that the inherited baseUrl property inserts into the CGI path.
    shortName = 'mallorychan'
    # Full scraper name, grouped under the TheFallenAngel/ prefix.
    name = 'TheFallenAngel/MalloryChan'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class HMHigh(_BasicScraper):
    """Scraper settings for http://www.thefallenangel.co.uk/hmhigh/."""

    # Full scraper name, grouped under the TheFallenAngel/ prefix.
    name = 'TheFallenAngel/HMHigh'

    # Base URL of the comic; strip URLs append an id query to it.
    latestUrl = 'http://www.thefallenangel.co.uk/hmhigh/'
    # Strip URL template: the '%s' placeholder takes the strip id.
    stripUrl = latestUrl + '?id=%s'

    # Hint describing what an index looks like.
    help = 'Index format: nnn'

    # Captures the href of the titled "Prev" link (note the leading space).
    prevSearch = compile(
        r' <a href="(http://www.thefallenangel.co.uk/.+?)" title=".+?">Prev</a>'
    )
    # Captures the absolute image URL below hmhigh/img/comic/.
    imageSearch = compile(
        r'<img src="(http://www.thefallenangel.co.uk/hmhigh/img/comic/.+?)"'
    )
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class TheOuterQuarter(_BasicScraper):
    """Scraper settings for the comic at http://theouterquarter.com/."""

    # Site root; strip URLs live below comic/.
    latestUrl = 'http://theouterquarter.com/'
    # Strip URL template: the '%s' placeholder takes the strip index.
    stripUrl = latestUrl + 'comic/%s'

    # Hint describing what an index looks like.
    help = 'Index format: nnn'

    # Captures the href of the rel="prev" link inside the nav-previous div.
    prevSearch = compile(
        r'<div class="nav-previous">'
        r'<a href="([^"]+)" rel="prev">'
    )
    # Captures the absolute image URL below /comics/.
    imageSearch = compile(r'<img src="(http://theouterquarter.com/comics/.+?)"')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class TheHorrificAdventuresOfFranky(_BasicScraper):
    """Scraper settings for the comic at http://www.boneyardfranky.com/."""

    # Site root; strip URLs append a ?p= query to it.
    latestUrl = 'http://www.boneyardfranky.com/'
    # Strip URL template: the '%s' placeholder takes the strip index.
    stripUrl = latestUrl + '?p=%s'

    # Hint describing what an index looks like.
    help = 'Index format: nnn'

    # Captures the href of the link inside the nav-previous div.
    prevSearch = compile(
        r'<div class="nav-previous">'
        r'<a href="(.+?)">'
    )
    # Captures the absolute image URL below /comics/.
    imageSearch = compile(r'<img src="(http://www.boneyardfranky.com/comics/.+?)"')
|