s/baseurl/baseUrl/g
This commit is contained in:
parent
c246b41d64
commit
f15f993851
15 changed files with 119 additions and 119 deletions
|
@ -18,9 +18,9 @@ class AbleAndBaker(_BasicScraper):
|
|||
|
||||
|
||||
class AbsurdNotions(_BasicScraper):
|
||||
baseurl = 'http://www.absurdnotions.org/'
|
||||
url = baseurl + 'page129.html'
|
||||
stripUrl = baseurl + 'page%s.html'
|
||||
baseUrl = 'http://www.absurdnotions.org/'
|
||||
url = baseUrl + 'page129.html'
|
||||
stripUrl = baseUrl + 'page%s.html'
|
||||
firstStripUrl = stripUrl % '1'
|
||||
imageSearch = compile(tagre('img', 'src', r'(an[^"]+)'))
|
||||
multipleImagesPerStrip = True
|
||||
|
@ -74,9 +74,9 @@ class AetheriaEpics(_BasicScraper):
|
|||
|
||||
|
||||
class AfterStrife(_BasicScraper):
|
||||
baseurl = 'http://afterstrife.com/'
|
||||
rurl = escape(baseurl)
|
||||
stripUrl = baseurl + '?p=%s'
|
||||
baseUrl = 'http://afterstrife.com/'
|
||||
rurl = escape(baseUrl)
|
||||
stripUrl = baseUrl + '?p=%s'
|
||||
url = stripUrl % '262'
|
||||
firstStripUrl = stripUrl % '1'
|
||||
imageSearch = compile(r'<img src="(%sstrips/.+?)"' % rurl)
|
||||
|
@ -148,9 +148,9 @@ class AlienLovesPredator(_BasicScraper):
|
|||
|
||||
|
||||
class AlienShores(_BasicScraper):
|
||||
baseurl = 'http://alienshores.com/'
|
||||
rurl = escape(baseurl)
|
||||
url = baseurl + 'alienshores_band/'
|
||||
baseUrl = 'http://alienshores.com/'
|
||||
rurl = escape(baseUrl)
|
||||
url = baseUrl + 'alienshores_band/'
|
||||
stripUrl = url + '%s'
|
||||
imageSearch = compile(tagre("img", "src", r'(%salienshores_band/wp-content/uploads/[^"]+)' % rurl))
|
||||
prevSearch = compile(tagre("a", "href", r'(%s[^"]+)' % rurl, after="prev"))
|
||||
|
@ -258,10 +258,10 @@ class Angels2200(_BasicScraper):
|
|||
|
||||
|
||||
class Annyseed(_BasicScraper):
|
||||
baseurl = 'http://www.colourofivy.com/'
|
||||
rurl = escape(baseurl)
|
||||
url = baseurl + 'annyseed_webcomic_latest.htm'
|
||||
stripUrl = baseurl + 'annyseed_webcomic%s.htm'
|
||||
baseUrl = 'http://www.colourofivy.com/'
|
||||
rurl = escape(baseUrl)
|
||||
url = baseUrl + 'annyseed_webcomic_latest.htm'
|
||||
stripUrl = baseUrl + 'annyseed_webcomic%s.htm'
|
||||
imageSearch = compile(tagre("img", "src", r'(Annyseed[^"]+)'))
|
||||
prevSearch = compile(r'<a href="(%s[^"]+)"><img src="Last.gif"' % rurl)
|
||||
help = 'Index format: nnn'
|
||||
|
@ -297,11 +297,11 @@ class ASofterWorld(_BasicScraper):
|
|||
|
||||
|
||||
class AstronomyPOTD(_BasicScraper):
|
||||
baseurl = 'http://antwrp.gsfc.nasa.gov/apod/'
|
||||
url = baseurl + 'astropix.html'
|
||||
baseUrl = 'http://antwrp.gsfc.nasa.gov/apod/'
|
||||
url = baseUrl + 'astropix.html'
|
||||
starter = bounceStarter(url,
|
||||
compile(tagre("a", "href", r'(ap\d{6}\.html)') + "></a>"))
|
||||
stripUrl = baseurl + 'ap%s.html'
|
||||
stripUrl = baseUrl + 'ap%s.html'
|
||||
firstStripUrl = stripUrl % '061012'
|
||||
imageSearch = compile(tagre("a", "href", r'(image/\d{4}/[^"]+)'))
|
||||
multipleImagesPerStrip = True
|
||||
|
|
|
@ -101,11 +101,11 @@ class ChainsawSuit(_BasicScraper):
|
|||
|
||||
|
||||
class Champ2010(_BasicScraper):
|
||||
baseurl = 'http://jedcollins.com/champ2010/'
|
||||
rurl = escape(baseurl)
|
||||
baseUrl = 'http://jedcollins.com/champ2010/'
|
||||
rurl = escape(baseUrl)
|
||||
# the latest URL is hard coded since the comic is discontinued
|
||||
url = baseurl + 'champ-12-30-10.html'
|
||||
stripUrl = baseurl + '%s.html'
|
||||
url = baseUrl + 'champ-12-30-10.html'
|
||||
stripUrl = baseUrl + '%s.html'
|
||||
firstStripUrl = stripUrl % 'champ1-1-10-fuck'
|
||||
imageSearch = compile(tagre("img", "src", r'(%scomics/[^"]+)' % rurl))
|
||||
prevSearch = compile(tagre("a", "href", r'(%s[^"]+)' % rurl, after="Previous"))
|
||||
|
@ -323,9 +323,9 @@ class CrimsonDark(_BasicScraper):
|
|||
|
||||
class CraftedFables(_BasicScraper):
|
||||
url = 'http://www.craftedfables.com/'
|
||||
baseurl = 'http://www.caf-fiends.net/'
|
||||
rurl = escape(baseurl)
|
||||
stripUrl = baseurl + 'craftedfables/?p=%s'
|
||||
baseUrl = 'http://www.caf-fiends.net/'
|
||||
rurl = escape(baseUrl)
|
||||
stripUrl = baseUrl + 'craftedfables/?p=%s'
|
||||
imageSearch = compile(tagre("img", "src", r'(%scraftedfables/comics/[^"]+)' % rurl))
|
||||
prevSearch = compile(tagre("a", "href", r'(%scraftedfables/[^"]+)' % rurl) +
|
||||
tagre("span", "class", r"prev"))
|
||||
|
|
|
@ -9,12 +9,12 @@ from ..util import tagre
|
|||
_imageSearch = compile(tagre("a", "href", r'(/comics/\d+/[^"]+)'))
|
||||
|
||||
def add(name, path):
|
||||
baseurl = 'http://www.creators.com'
|
||||
baseUrl = 'http://www.creators.com'
|
||||
classname = 'Creators_%s' % name
|
||||
globals()[classname] = make_scraper(classname,
|
||||
name = 'Creators/' + name,
|
||||
url = baseurl + path + '.html',
|
||||
stripUrl = baseurl + path + '/%s.html',
|
||||
url = baseUrl + path + '.html',
|
||||
stripUrl = baseUrl + path + '/%s.html',
|
||||
lang = 'es' if name.lower().endswith('spanish') else 'en',
|
||||
imageSearch = _imageSearch,
|
||||
prevSearch = compile(tagre("a", "href", r'(%s/\d+\.html)' % path) +
|
||||
|
|
|
@ -258,9 +258,9 @@ class DresdenCodak(_BasicScraper):
|
|||
|
||||
|
||||
class DrFun(_BasicScraper):
|
||||
baseurl = 'http://www.ibiblio.org/Dave/'
|
||||
url = baseurl + 'ar00502.htm'
|
||||
stripUrl = baseurl + 'ar%s.htm'
|
||||
baseUrl = 'http://www.ibiblio.org/Dave/'
|
||||
url = baseUrl + 'ar00502.htm'
|
||||
stripUrl = baseUrl + 'ar%s.htm'
|
||||
firstStripUrl = stripUrl % '00001'
|
||||
imageSearch = compile(tagre("a", "href", r'(Dr-Fun/df\d+/df[^"]+)'))
|
||||
multipleImagesPerStrip = True
|
||||
|
@ -280,9 +280,9 @@ class DrMcNinja(_BasicScraper):
|
|||
|
||||
|
||||
class Drowtales(_BasicScraper):
|
||||
baseurl = 'http://www.drowtales.com/'
|
||||
rurl = escape(baseurl)
|
||||
url = baseurl + 'mainarchive.php'
|
||||
baseUrl = 'http://www.drowtales.com/'
|
||||
rurl = escape(baseUrl)
|
||||
url = baseUrl + 'mainarchive.php'
|
||||
stripUrl = url + '?sid=%s'
|
||||
firstStripUrl = stripUrl % '4192'
|
||||
imageSearch = (
|
||||
|
|
|
@ -19,9 +19,9 @@ class FalconTwin(_BasicScraper):
|
|||
|
||||
|
||||
class Fallen(_BasicScraper):
|
||||
baseurl = 'http://www.fallencomic.com/'
|
||||
url = baseurl + 'fal-page.htm'
|
||||
stripUrl = baseurl + 'pages/part%s/%s-p%s.htm'
|
||||
baseUrl = 'http://www.fallencomic.com/'
|
||||
url = baseUrl + 'fal-page.htm'
|
||||
stripUrl = baseUrl + 'pages/part%s/%s-p%s.htm'
|
||||
imageSearch = compile(r'<IMG SRC="(page/.+?)"', IGNORECASE)
|
||||
prevSearch = compile(r'<A HREF="(.+?)"><FONT FACE="Courier">Back', IGNORECASE)
|
||||
help = 'Index format: nn-m (comicNumber-partNumber)'
|
||||
|
@ -59,9 +59,9 @@ class FauxPas(_BasicScraper):
|
|||
|
||||
|
||||
class FeyWinds(_BasicScraper):
|
||||
baseurl = 'http://kitsune.rydia.net/'
|
||||
url = baseurl + 'index.html'
|
||||
stripUrl = baseurl + 'comic/page.php?id=%s'
|
||||
baseUrl = 'http://kitsune.rydia.net/'
|
||||
url = baseUrl + 'index.html'
|
||||
stripUrl = baseUrl + 'comic/page.php?id=%s'
|
||||
imageSearch = compile(r"(../comic/pages//.+?)'")
|
||||
prevSearch = compile(r"(page.php\?id=.+?)'.+?navprevious.png")
|
||||
help = 'Index format: n (unpadded)'
|
||||
|
@ -89,9 +89,9 @@ class FirstWorldProblems(_BasicScraper):
|
|||
|
||||
|
||||
class FlakyPastry(_BasicScraper):
|
||||
baseurl = 'http://flakypastry.runningwithpencils.com/'
|
||||
url = baseurl + 'index.php'
|
||||
stripUrl = baseurl + 'comic.php?strip_id=%s'
|
||||
baseUrl = 'http://flakypastry.runningwithpencils.com/'
|
||||
url = baseUrl + 'index.php'
|
||||
stripUrl = baseUrl + 'comic.php?strip_id=%s'
|
||||
firstStripUrl = stripUrl % '0'
|
||||
imageSearch = compile(r'<img src="(comics/.+?)"')
|
||||
prevSearch = compile(r'<a href="(.+?)".+?btn_back')
|
||||
|
|
|
@ -20,12 +20,12 @@ class Galaxion(_BasicScraper):
|
|||
|
||||
|
||||
class Garanos(_BasicScraper):
|
||||
baseurl = 'http://garanos.alexheberling.com/'
|
||||
rurl = escape(baseurl)
|
||||
url = baseurl + 'pages/page-1/'
|
||||
baseUrl = 'http://garanos.alexheberling.com/'
|
||||
rurl = escape(baseUrl)
|
||||
url = baseUrl + 'pages/page-1/'
|
||||
starter = indirectStarter(url,
|
||||
compile(tagre("a", "href", r'(%spages/[^"]+)' % rurl, after="navi-last")))
|
||||
stripUrl = baseurl + 'pages/page-%s'
|
||||
stripUrl = baseUrl + 'pages/page-%s'
|
||||
imageSearch = compile(tagre("img", "src", r'(%scomics/[^"]+)' % rurl))
|
||||
prevSearch = compile(tagre("a", "href", r'(%spages/[^"]+)' % rurl, after="prev"))
|
||||
help = 'Index format: n (unpadded)'
|
||||
|
|
|
@ -35,9 +35,9 @@ class KevinAndKell(_BasicScraper):
|
|||
|
||||
|
||||
class Key(_BasicScraper):
|
||||
baseurl = 'http://key.shadilyn.com/'
|
||||
url = baseurl + 'latestpage.html'
|
||||
stripUrl = baseurl + 'pages/%s.html'
|
||||
baseUrl = 'http://key.shadilyn.com/'
|
||||
url = baseUrl + 'latestpage.html'
|
||||
stripUrl = baseUrl + 'pages/%s.html'
|
||||
imageSearch = compile(r'"((?:images/.+?)|(?:pages/images/.+?))"')
|
||||
prevSearch = compile(r'</a><a href="(.+?html)".+?prev')
|
||||
help = 'Index format: nnn'
|
||||
|
@ -54,9 +54,9 @@ class KickInTheHead(_BasicScraper):
|
|||
|
||||
|
||||
class KillerKomics(_BasicScraper):
|
||||
baseurl = 'http://www.killerkomics.com/web-comics/'
|
||||
url = baseurl + 'index_ang.cfm'
|
||||
stripUrl = baseurl + '%s.cfm'
|
||||
baseUrl = 'http://www.killerkomics.com/web-comics/'
|
||||
url = baseUrl + 'index_ang.cfm'
|
||||
stripUrl = baseUrl + '%s.cfm'
|
||||
imageSearch = compile(r'<img src="(http://www.killerkomics.com/FichiersUpload/Comics/.+?)"')
|
||||
prevSearch = compile(r'<div id="precedent"><a href="(.+?)"')
|
||||
help = 'Index format: strip-name'
|
||||
|
@ -82,9 +82,9 @@ class Krakow(_BasicScraper):
|
|||
|
||||
|
||||
class Kukuburi(_BasicScraper):
|
||||
baseurl = 'http://www.kukuburi.com/'
|
||||
url = baseurl + 'current/'
|
||||
stripUrl = baseurl + 'v2/%s/'
|
||||
baseUrl = 'http://www.kukuburi.com/'
|
||||
url = baseUrl + 'current/'
|
||||
stripUrl = baseUrl + 'v2/%s/'
|
||||
firstStripUrl = stripUrl % '2007/08/09/one'
|
||||
imageSearch = compile(tagre("img", "src", r'(http://www\.kukuburi\.com/v2/comics/[^"]+)', after='alt="[^"]'))
|
||||
prevSearch = compile(r'nav-previous.+?"(http.+?)"')
|
||||
|
|
|
@ -141,10 +141,10 @@ class NobodyScores(_BasicScraper):
|
|||
|
||||
|
||||
class NoNeedForBushido(_BasicScraper):
|
||||
baseurl = 'http://noneedforbushido.com/'
|
||||
rurl = escape(baseurl)
|
||||
url = baseurl + 'latest/'
|
||||
stripUrl = baseurl + '%s/'
|
||||
baseUrl = 'http://noneedforbushido.com/'
|
||||
rurl = escape(baseUrl)
|
||||
url = baseUrl + 'latest/'
|
||||
stripUrl = baseUrl + '%s/'
|
||||
imageSearch = compile(tagre("img", "src", r'(%scomics/comic/[^"]+)' % rurl))
|
||||
prevSearch = compile(tagre("a", "href", r'(%s[^"]+)' % rurl, after="previous-comic-link"))
|
||||
help = 'Index format: yyyy/comic/nnn'
|
||||
|
|
|
@ -50,9 +50,9 @@ class PartiallyClips(_BasicScraper):
|
|||
|
||||
|
||||
class PastelDefender(_BasicScraper):
|
||||
baseurl = 'http://www.pasteldefender.com/'
|
||||
url = baseurl + 'coverbackcover.html'
|
||||
stripUrl = baseurl + '%s.html'
|
||||
baseUrl = 'http://www.pasteldefender.com/'
|
||||
url = baseUrl + 'coverbackcover.html'
|
||||
stripUrl = baseUrl + '%s.html'
|
||||
firstStripUrl = stripUrl % 'cover'
|
||||
imageSearch = compile(r'<IMG SRC="(images/.+?)" WIDTH="742"')
|
||||
prevSearch = compile(r'<A HREF="([^"]+)"><IMG SRC="images/back\.gif"')
|
||||
|
@ -107,9 +107,9 @@ class PeppermintSaga(_BasicScraper):
|
|||
|
||||
|
||||
class PHDComics(_BasicScraper):
|
||||
baseurl = 'http://phdcomics.com/'
|
||||
url = baseurl + 'comics.php'
|
||||
stripUrl = baseurl + 'comics/archive.php?comicid=%s'
|
||||
baseUrl = 'http://phdcomics.com/'
|
||||
url = baseUrl + 'comics.php'
|
||||
stripUrl = baseUrl + 'comics/archive.php?comicid=%s'
|
||||
firstStripUrl = stripUrl % '1'
|
||||
imageSearch = compile(tagre("img", "src", r'(http://www\.phdcomics\.com/comics/archive/phd[^ ]+)', quote=""))
|
||||
prevSearch = compile(tagre("a", "href", r'((?:comics/)?archive\.php\?comicid=\d+)', quote="") +
|
||||
|
@ -167,9 +167,9 @@ class _PlanescapeSurvival(_BasicScraper):
|
|||
|
||||
|
||||
class PokeyThePenguin(_BasicScraper):
|
||||
baseurl = 'http://www.yellow5.com/pokey/archive/'
|
||||
url = baseurl + 'index558.html'
|
||||
stripUrl = baseurl + 'index%s.html'
|
||||
baseUrl = 'http://www.yellow5.com/pokey/archive/'
|
||||
url = baseUrl + 'index558.html'
|
||||
stripUrl = baseUrl + 'index%s.html'
|
||||
firstStripUrl = stripUrl % '1'
|
||||
imageSearch = compile(tagre("img", "src", r'(pokey\d+[^"]+)'))
|
||||
prevSearch = True
|
||||
|
|
|
@ -17,9 +17,9 @@ class QuestionableContent(_BasicScraper):
|
|||
|
||||
|
||||
class Qwantz(_BasicScraper):
|
||||
baseurl = 'http://www.qwantz.com/'
|
||||
url = baseurl + 'index.php'
|
||||
rurl = escape(baseurl)
|
||||
baseUrl = 'http://www.qwantz.com/'
|
||||
url = baseUrl + 'index.php'
|
||||
rurl = escape(baseUrl)
|
||||
stripUrl = url + '?comic=%s'
|
||||
firstStripUrl = stripUrl % '1'
|
||||
imageSearch = compile(tagre("img", "src", r'(%scomics/[^"]+)' % rurl))
|
||||
|
|
|
@ -35,10 +35,10 @@ class RealmOfAtland(_BasicScraper):
|
|||
|
||||
|
||||
class RedMeat(_BasicScraper):
|
||||
baseurl = 'http://www.redmeat.com/redmeat/'
|
||||
url = baseurl + 'current/index.html'
|
||||
baseUrl = 'http://www.redmeat.com/redmeat/'
|
||||
url = baseUrl + 'current/index.html'
|
||||
starter = bounceStarter(url, compile(r'<a href="(\.\./\d{4}-\d{2}-\d{2}/index\.html)">next</a>'))
|
||||
stripUrl = baseurl + '%s/index.html'
|
||||
stripUrl = baseUrl + '%s/index.html'
|
||||
firstStripUrl = stripUrl % '1996-06-10'
|
||||
imageSearch = compile(r'<img src="(index-1\.gif)" width="\d+" height="\d+" [^>]*>')
|
||||
prevSearch = compile(r'<a href="(\.\./\d{4}-\d{2}-\d{2}/index\.html)">previous</a>')
|
||||
|
|
|
@ -316,9 +316,9 @@ class SodiumEyes(_BasicScraper):
|
|||
|
||||
class Sorcery101(_BasicScraper):
|
||||
description = u'Welcome to the site of Kel McDonald, professional comic illustrator and writer.'
|
||||
baseurl = 'http://www.sorcery101.net/'
|
||||
url = baseurl + 'sorcery-101/'
|
||||
rurl = escape(baseurl)
|
||||
baseUrl = 'http://www.sorcery101.net/'
|
||||
url = baseUrl + 'sorcery-101/'
|
||||
rurl = escape(baseUrl)
|
||||
stripUrl = url + '%s/'
|
||||
imageSearch = compile(tagre("img", "src", r'(%swp-content/uploads/\d+/\d+/[^"]+)' % rurl))
|
||||
prevSearch = compile(tagre("a", "href", r'(%ssorcery-101/[^"]+)' % rurl, after="previous-"))
|
||||
|
@ -475,10 +475,10 @@ class SomethingPositive(_BasicScraper):
|
|||
|
||||
class StarCrossdDestiny(_BasicScraper):
|
||||
description = u'Furturistic fantasy. A group of outcasts fight to survive in a world that shuns them as freaks.'
|
||||
baseurl = 'http://www.starcrossd.net/'
|
||||
rurl = escape(baseurl)
|
||||
url = baseurl + 'comic.html'
|
||||
stripUrl = baseurl + 'archives/%s.html'
|
||||
baseUrl = 'http://www.starcrossd.net/'
|
||||
rurl = escape(baseUrl)
|
||||
url = baseUrl + 'comic.html'
|
||||
stripUrl = baseUrl + 'archives/%s.html'
|
||||
firstStripUrl = stripUrl % '00000001'
|
||||
imageSearch = compile(tagre("img", "src", r'(%s(?:ch1|strips|book2)/[^"]+)' % rurl))
|
||||
prevSearch = compile(r'<a href="(%s(?:ch1/)?archives/\d+\.html)"[^>]*"[^"]*"[^>]*>prev' % rurl, IGNORECASE)
|
||||
|
|
|
@ -37,14 +37,14 @@ class TheNoob(_BasicScraper):
|
|||
|
||||
|
||||
class TheOrderOfTheStick(_BasicScraper):
|
||||
baseurl = 'http://www.giantitp.com/'
|
||||
url = baseurl + 'comics/oots0863.html'
|
||||
stripUrl = baseurl + 'comics/oots%s.html'
|
||||
baseUrl = 'http://www.giantitp.com/'
|
||||
url = baseUrl + 'comics/oots0863.html'
|
||||
stripUrl = baseUrl + 'comics/oots%s.html'
|
||||
firstStripUrl = stripUrl % '0001'
|
||||
imageSearch = compile(r'<IMG src="(/comics/images/[^"]+)">')
|
||||
prevSearch = compile(r'<A href="(/comics/oots\d{4}\.html)"><IMG src="/Images/redesign/ComicNav_Back.gif"')
|
||||
help = 'Index format: n (unpadded)'
|
||||
starter = indirectStarter(baseurl, compile(r'<A href="(/comics/oots\d{4}\.html)"'))
|
||||
starter = indirectStarter(baseUrl, compile(r'<A href="(/comics/oots\d{4}\.html)"'))
|
||||
|
||||
@classmethod
|
||||
def namer(cls, imageUrl, pageUrl):
|
||||
|
@ -52,9 +52,9 @@ class TheOrderOfTheStick(_BasicScraper):
|
|||
|
||||
|
||||
class TheParkingLotIsFull(_BasicScraper):
|
||||
baseurl = 'http://plif.courageunfettered.com/'
|
||||
url = baseurl + 'archive/arch2002.htm'
|
||||
stripUrl = baseurl + 'archive/arch%s.htm'
|
||||
baseUrl = 'http://plif.courageunfettered.com/'
|
||||
url = baseUrl + 'archive/arch2002.htm'
|
||||
stripUrl = baseUrl + 'archive/arch%s.htm'
|
||||
firstStripUrl = stripUrl % '1998'
|
||||
imageSearch = compile(r'<td align="center"><A TARGET=_parent HREF="(wc\d+\..+?)">')
|
||||
multipleImagesPerStrip = True
|
||||
|
@ -147,9 +147,9 @@ class TheWhiteboard(_BasicScraper):
|
|||
|
||||
class HMHigh(_BasicScraper):
|
||||
name = 'TheFallenAngel/HMHigh'
|
||||
baseurl = 'http://www.thefallenangel.co.uk/'
|
||||
url = baseurl + 'hmhigh/'
|
||||
rurl = escape(baseurl)
|
||||
baseUrl = 'http://www.thefallenangel.co.uk/'
|
||||
url = baseUrl + 'hmhigh/'
|
||||
rurl = escape(baseUrl)
|
||||
stripUrl = url + '?id=%s'
|
||||
imageSearch = compile(r'<img src="(%shmhigh/img/comic/.+?)"' % rurl)
|
||||
prevSearch = compile(r' <a href="(%s.+?)" title=".+?">Prev</a>' % rurl)
|
||||
|
|
|
@ -20,9 +20,9 @@ class Undertow(_BasicScraper):
|
|||
|
||||
|
||||
class UnicornJelly(_BasicScraper):
|
||||
baseurl = 'http://unicornjelly.com/'
|
||||
url = baseurl + 'uni666.html'
|
||||
stripUrl = baseurl + 'uni%s.html'
|
||||
baseUrl = 'http://unicornjelly.com/'
|
||||
url = baseUrl + 'uni666.html'
|
||||
stripUrl = baseUrl + 'uni%s.html'
|
||||
firstStripUrl = stripUrl % '001'
|
||||
imageSearch = compile(r'</TABLE>(?:<FONT COLOR="BLACK">)?<IMG SRC="(images/[^"]+)" WIDTH=')
|
||||
prevSearch = compile(r'<A HREF="(uni\d{3}[bcs]?\.html)">(<FONT COLOR="BLACK">)?<IMG SRC="images/back00\.gif"')
|
||||
|
|
|
@ -75,18 +75,18 @@ class WeCanSleepTomorrow(_BasicScraper):
|
|||
|
||||
|
||||
class WhiteNinja(_BasicScraper):
|
||||
baseurl = 'http://www.whiteninjacomics.com/'
|
||||
url = baseurl + 'comics.shtml'
|
||||
stripUrl = baseurl + 'comics/%s.shtml'
|
||||
baseUrl = 'http://www.whiteninjacomics.com/'
|
||||
url = baseUrl + 'comics.shtml'
|
||||
stripUrl = baseUrl + 'comics/%s.shtml'
|
||||
imageSearch = compile(r'<img src=(/images/comics/(?!t-).+?\.gif) border=0')
|
||||
prevSearch = compile(r'(/comics/.+?shtml).+?previous')
|
||||
help = 'Index format: s (comic name)'
|
||||
|
||||
|
||||
class WhiteNoise(_BasicScraper):
|
||||
baseurl = 'http://www.wncomic.com/'
|
||||
url = baseurl + 'archive.php'
|
||||
stripUrl = baseurl + 'archive_comments.php?strip_id=%s'
|
||||
baseUrl = 'http://www.wncomic.com/'
|
||||
url = baseUrl + 'archive.php'
|
||||
stripUrl = baseUrl + 'archive_comments.php?strip_id=%s'
|
||||
firstStripUrl = stripUrl % '1'
|
||||
imageSearch = compile(r'(istrip_files/strips/.+?)"')
|
||||
prevSearch = compile(r'</a><a href="(.+?)"><img src="images/top_back.jpg" ')
|
||||
|
@ -94,10 +94,10 @@ class WhiteNoise(_BasicScraper):
|
|||
|
||||
|
||||
class WhyTheLongFace(_BasicScraper):
|
||||
baseurl = 'http://www.absurdnotions.org/'
|
||||
rurl = escape(baseurl)
|
||||
url = baseurl + 'wtlf200709.html'
|
||||
stripUrl = baseurl + 'wtlf%s.html'
|
||||
baseUrl = 'http://www.absurdnotions.org/'
|
||||
rurl = escape(baseUrl)
|
||||
url = baseUrl + 'wtlf200709.html'
|
||||
stripUrl = baseUrl + 'wtlf%s.html'
|
||||
firstStripUrl = stripUrl % '200306'
|
||||
imageSearch = compile(r'<img src="(%swtlf.+?|lf\d+.\w{1,4})"' % rurl, IGNORECASE)
|
||||
multipleImagesPerStrip = True
|
||||
|
@ -134,26 +134,26 @@ class Wondermark(_BasicScraper):
|
|||
|
||||
|
||||
class WorldOfMrToast(_BasicScraper):
|
||||
baseurl = 'http://www.theimaginaryworld.com/'
|
||||
url = baseurl + 'mrTcomicA.html'
|
||||
stripUrl = baseurl + '%s.html'
|
||||
baseUrl = 'http://www.theimaginaryworld.com/'
|
||||
url = baseUrl + 'mrTcomicA.html'
|
||||
stripUrl = baseUrl + '%s.html'
|
||||
imageSearch = compile(tagre("img", "src", r'(comic[^"]+)'))
|
||||
# list the archive links since there is no prev/next navigation
|
||||
prevurls = (
|
||||
url,
|
||||
baseurl + 'mrTcomicW02.html',
|
||||
baseurl + 'mrTcomicW01.html',
|
||||
baseurl + 'mrGcomic03.html',
|
||||
baseurl + 'mrGcomic02.html',
|
||||
baseurl + 'mrGcomic01.html',
|
||||
baseurl + 'mrTcomicT05.html',
|
||||
baseurl + 'mrTcomicT04.html',
|
||||
baseurl + 'mrTcomicT03.html',
|
||||
baseurl + 'mrTcomicT02.html',
|
||||
baseurl + 'mrTcomicT01.html',
|
||||
baseurl + 'mrTcomicIW3.html',
|
||||
baseurl + 'mrTcomicIW2.html',
|
||||
baseurl + 'mrTcomicIW1.html',
|
||||
baseUrl + 'mrTcomicW02.html',
|
||||
baseUrl + 'mrTcomicW01.html',
|
||||
baseUrl + 'mrGcomic03.html',
|
||||
baseUrl + 'mrGcomic02.html',
|
||||
baseUrl + 'mrGcomic01.html',
|
||||
baseUrl + 'mrTcomicT05.html',
|
||||
baseUrl + 'mrTcomicT04.html',
|
||||
baseUrl + 'mrTcomicT03.html',
|
||||
baseUrl + 'mrTcomicT02.html',
|
||||
baseUrl + 'mrTcomicT01.html',
|
||||
baseUrl + 'mrTcomicIW3.html',
|
||||
baseUrl + 'mrTcomicIW2.html',
|
||||
baseUrl + 'mrTcomicIW1.html',
|
||||
)
|
||||
firstStripUrl = prevurls[-1]
|
||||
multipleImagesPerStrip = True
|
||||
|
|
Loading…
Reference in a new issue