s/baseurl/baseUrl/g

This commit is contained in:
Bastian Kleineidam 2013-04-13 20:58:00 +02:00
parent c246b41d64
commit f15f993851
15 changed files with 119 additions and 119 deletions

View file

@ -18,9 +18,9 @@ class AbleAndBaker(_BasicScraper):
class AbsurdNotions(_BasicScraper):
baseurl = 'http://www.absurdnotions.org/'
url = baseurl + 'page129.html'
stripUrl = baseurl + 'page%s.html'
baseUrl = 'http://www.absurdnotions.org/'
url = baseUrl + 'page129.html'
stripUrl = baseUrl + 'page%s.html'
firstStripUrl = stripUrl % '1'
imageSearch = compile(tagre('img', 'src', r'(an[^"]+)'))
multipleImagesPerStrip = True
@ -74,9 +74,9 @@ class AetheriaEpics(_BasicScraper):
class AfterStrife(_BasicScraper):
baseurl = 'http://afterstrife.com/'
rurl = escape(baseurl)
stripUrl = baseurl + '?p=%s'
baseUrl = 'http://afterstrife.com/'
rurl = escape(baseUrl)
stripUrl = baseUrl + '?p=%s'
url = stripUrl % '262'
firstStripUrl = stripUrl % '1'
imageSearch = compile(r'<img src="(%sstrips/.+?)"' % rurl)
@ -148,9 +148,9 @@ class AlienLovesPredator(_BasicScraper):
class AlienShores(_BasicScraper):
baseurl = 'http://alienshores.com/'
rurl = escape(baseurl)
url = baseurl + 'alienshores_band/'
baseUrl = 'http://alienshores.com/'
rurl = escape(baseUrl)
url = baseUrl + 'alienshores_band/'
stripUrl = url + '%s'
imageSearch = compile(tagre("img", "src", r'(%salienshores_band/wp-content/uploads/[^"]+)' % rurl))
prevSearch = compile(tagre("a", "href", r'(%s[^"]+)' % rurl, after="prev"))
@ -258,10 +258,10 @@ class Angels2200(_BasicScraper):
class Annyseed(_BasicScraper):
baseurl = 'http://www.colourofivy.com/'
rurl = escape(baseurl)
url = baseurl + 'annyseed_webcomic_latest.htm'
stripUrl = baseurl + 'annyseed_webcomic%s.htm'
baseUrl = 'http://www.colourofivy.com/'
rurl = escape(baseUrl)
url = baseUrl + 'annyseed_webcomic_latest.htm'
stripUrl = baseUrl + 'annyseed_webcomic%s.htm'
imageSearch = compile(tagre("img", "src", r'(Annyseed[^"]+)'))
prevSearch = compile(r'<a href="(%s[^"]+)"><img src="Last.gif"' % rurl)
help = 'Index format: nnn'
@ -297,11 +297,11 @@ class ASofterWorld(_BasicScraper):
class AstronomyPOTD(_BasicScraper):
baseurl = 'http://antwrp.gsfc.nasa.gov/apod/'
url = baseurl + 'astropix.html'
baseUrl = 'http://antwrp.gsfc.nasa.gov/apod/'
url = baseUrl + 'astropix.html'
starter = bounceStarter(url,
compile(tagre("a", "href", r'(ap\d{6}\.html)') + "&gt;</a>"))
stripUrl = baseurl + 'ap%s.html'
stripUrl = baseUrl + 'ap%s.html'
firstStripUrl = stripUrl % '061012'
imageSearch = compile(tagre("a", "href", r'(image/\d{4}/[^"]+)'))
multipleImagesPerStrip = True

View file

@ -101,11 +101,11 @@ class ChainsawSuit(_BasicScraper):
class Champ2010(_BasicScraper):
baseurl = 'http://jedcollins.com/champ2010/'
rurl = escape(baseurl)
baseUrl = 'http://jedcollins.com/champ2010/'
rurl = escape(baseUrl)
# the latest URL is hard coded since the comic is discontinued
url = baseurl + 'champ-12-30-10.html'
stripUrl = baseurl + '%s.html'
url = baseUrl + 'champ-12-30-10.html'
stripUrl = baseUrl + '%s.html'
firstStripUrl = stripUrl % 'champ1-1-10-fuck'
imageSearch = compile(tagre("img", "src", r'(%scomics/[^"]+)' % rurl))
prevSearch = compile(tagre("a", "href", r'(%s[^"]+)' % rurl, after="Previous"))
@ -323,9 +323,9 @@ class CrimsonDark(_BasicScraper):
class CraftedFables(_BasicScraper):
url = 'http://www.craftedfables.com/'
baseurl = 'http://www.caf-fiends.net/'
rurl = escape(baseurl)
stripUrl = baseurl + 'craftedfables/?p=%s'
baseUrl = 'http://www.caf-fiends.net/'
rurl = escape(baseUrl)
stripUrl = baseUrl + 'craftedfables/?p=%s'
imageSearch = compile(tagre("img", "src", r'(%scraftedfables/comics/[^"]+)' % rurl))
prevSearch = compile(tagre("a", "href", r'(%scraftedfables/[^"]+)' % rurl) +
tagre("span", "class", r"prev"))

View file

@ -9,12 +9,12 @@ from ..util import tagre
_imageSearch = compile(tagre("a", "href", r'(/comics/\d+/[^"]+)'))
def add(name, path):
baseurl = 'http://www.creators.com'
baseUrl = 'http://www.creators.com'
classname = 'Creators_%s' % name
globals()[classname] = make_scraper(classname,
name = 'Creators/' + name,
url = baseurl + path + '.html',
stripUrl = baseurl + path + '/%s.html',
url = baseUrl + path + '.html',
stripUrl = baseUrl + path + '/%s.html',
lang = 'es' if name.lower().endswith('spanish') else 'en',
imageSearch = _imageSearch,
prevSearch = compile(tagre("a", "href", r'(%s/\d+\.html)' % path) +

View file

@ -258,9 +258,9 @@ class DresdenCodak(_BasicScraper):
class DrFun(_BasicScraper):
baseurl = 'http://www.ibiblio.org/Dave/'
url = baseurl + 'ar00502.htm'
stripUrl = baseurl + 'ar%s.htm'
baseUrl = 'http://www.ibiblio.org/Dave/'
url = baseUrl + 'ar00502.htm'
stripUrl = baseUrl + 'ar%s.htm'
firstStripUrl = stripUrl % '00001'
imageSearch = compile(tagre("a", "href", r'(Dr-Fun/df\d+/df[^"]+)'))
multipleImagesPerStrip = True
@ -280,9 +280,9 @@ class DrMcNinja(_BasicScraper):
class Drowtales(_BasicScraper):
baseurl = 'http://www.drowtales.com/'
rurl = escape(baseurl)
url = baseurl + 'mainarchive.php'
baseUrl = 'http://www.drowtales.com/'
rurl = escape(baseUrl)
url = baseUrl + 'mainarchive.php'
stripUrl = url + '?sid=%s'
firstStripUrl = stripUrl % '4192'
imageSearch = (

View file

@ -19,9 +19,9 @@ class FalconTwin(_BasicScraper):
class Fallen(_BasicScraper):
baseurl = 'http://www.fallencomic.com/'
url = baseurl + 'fal-page.htm'
stripUrl = baseurl + 'pages/part%s/%s-p%s.htm'
baseUrl = 'http://www.fallencomic.com/'
url = baseUrl + 'fal-page.htm'
stripUrl = baseUrl + 'pages/part%s/%s-p%s.htm'
imageSearch = compile(r'<IMG SRC="(page/.+?)"', IGNORECASE)
prevSearch = compile(r'<A HREF="(.+?)"><FONT FACE="Courier">Back', IGNORECASE)
help = 'Index format: nn-m (comicNumber-partNumber)'
@ -59,9 +59,9 @@ class FauxPas(_BasicScraper):
class FeyWinds(_BasicScraper):
baseurl = 'http://kitsune.rydia.net/'
url = baseurl + 'index.html'
stripUrl = baseurl + 'comic/page.php?id=%s'
baseUrl = 'http://kitsune.rydia.net/'
url = baseUrl + 'index.html'
stripUrl = baseUrl + 'comic/page.php?id=%s'
imageSearch = compile(r"(../comic/pages//.+?)'")
prevSearch = compile(r"(page.php\?id=.+?)'.+?navprevious.png")
help = 'Index format: n (unpadded)'
@ -89,9 +89,9 @@ class FirstWorldProblems(_BasicScraper):
class FlakyPastry(_BasicScraper):
baseurl = 'http://flakypastry.runningwithpencils.com/'
url = baseurl + 'index.php'
stripUrl = baseurl + 'comic.php?strip_id=%s'
baseUrl = 'http://flakypastry.runningwithpencils.com/'
url = baseUrl + 'index.php'
stripUrl = baseUrl + 'comic.php?strip_id=%s'
firstStripUrl = stripUrl % '0'
imageSearch = compile(r'<img src="(comics/.+?)"')
prevSearch = compile(r'<a href="(.+?)".+?btn_back')

View file

@ -20,12 +20,12 @@ class Galaxion(_BasicScraper):
class Garanos(_BasicScraper):
baseurl = 'http://garanos.alexheberling.com/'
rurl = escape(baseurl)
url = baseurl + 'pages/page-1/'
baseUrl = 'http://garanos.alexheberling.com/'
rurl = escape(baseUrl)
url = baseUrl + 'pages/page-1/'
starter = indirectStarter(url,
compile(tagre("a", "href", r'(%spages/[^"]+)' % rurl, after="navi-last")))
stripUrl = baseurl + 'pages/page-%s'
stripUrl = baseUrl + 'pages/page-%s'
imageSearch = compile(tagre("img", "src", r'(%scomics/[^"]+)' % rurl))
prevSearch = compile(tagre("a", "href", r'(%spages/[^"]+)' % rurl, after="prev"))
help = 'Index format: n (unpadded)'

View file

@ -35,9 +35,9 @@ class KevinAndKell(_BasicScraper):
class Key(_BasicScraper):
baseurl = 'http://key.shadilyn.com/'
url = baseurl + 'latestpage.html'
stripUrl = baseurl + 'pages/%s.html'
baseUrl = 'http://key.shadilyn.com/'
url = baseUrl + 'latestpage.html'
stripUrl = baseUrl + 'pages/%s.html'
imageSearch = compile(r'"((?:images/.+?)|(?:pages/images/.+?))"')
prevSearch = compile(r'</a><a href="(.+?html)".+?prev')
help = 'Index format: nnn'
@ -54,9 +54,9 @@ class KickInTheHead(_BasicScraper):
class KillerKomics(_BasicScraper):
baseurl = 'http://www.killerkomics.com/web-comics/'
url = baseurl + 'index_ang.cfm'
stripUrl = baseurl + '%s.cfm'
baseUrl = 'http://www.killerkomics.com/web-comics/'
url = baseUrl + 'index_ang.cfm'
stripUrl = baseUrl + '%s.cfm'
imageSearch = compile(r'<img src="(http://www.killerkomics.com/FichiersUpload/Comics/.+?)"')
prevSearch = compile(r'<div id="precedent"><a href="(.+?)"')
help = 'Index format: strip-name'
@ -82,9 +82,9 @@ class Krakow(_BasicScraper):
class Kukuburi(_BasicScraper):
baseurl = 'http://www.kukuburi.com/'
url = baseurl + 'current/'
stripUrl = baseurl + 'v2/%s/'
baseUrl = 'http://www.kukuburi.com/'
url = baseUrl + 'current/'
stripUrl = baseUrl + 'v2/%s/'
firstStripUrl = stripUrl % '2007/08/09/one'
imageSearch = compile(tagre("img", "src", r'(http://www\.kukuburi\.com/v2/comics/[^"]+)', after='alt="[^"]'))
prevSearch = compile(r'nav-previous.+?"(http.+?)"')

View file

@ -141,10 +141,10 @@ class NobodyScores(_BasicScraper):
class NoNeedForBushido(_BasicScraper):
baseurl = 'http://noneedforbushido.com/'
rurl = escape(baseurl)
url = baseurl + 'latest/'
stripUrl = baseurl + '%s/'
baseUrl = 'http://noneedforbushido.com/'
rurl = escape(baseUrl)
url = baseUrl + 'latest/'
stripUrl = baseUrl + '%s/'
imageSearch = compile(tagre("img", "src", r'(%scomics/comic/[^"]+)' % rurl))
prevSearch = compile(tagre("a", "href", r'(%s[^"]+)' % rurl, after="previous-comic-link"))
help = 'Index format: yyyy/comic/nnn'

View file

@ -50,9 +50,9 @@ class PartiallyClips(_BasicScraper):
class PastelDefender(_BasicScraper):
baseurl = 'http://www.pasteldefender.com/'
url = baseurl + 'coverbackcover.html'
stripUrl = baseurl + '%s.html'
baseUrl = 'http://www.pasteldefender.com/'
url = baseUrl + 'coverbackcover.html'
stripUrl = baseUrl + '%s.html'
firstStripUrl = stripUrl % 'cover'
imageSearch = compile(r'<IMG SRC="(images/.+?)" WIDTH="742"')
prevSearch = compile(r'<A HREF="([^"]+)"><IMG SRC="images/back\.gif"')
@ -107,9 +107,9 @@ class PeppermintSaga(_BasicScraper):
class PHDComics(_BasicScraper):
baseurl = 'http://phdcomics.com/'
url = baseurl + 'comics.php'
stripUrl = baseurl + 'comics/archive.php?comicid=%s'
baseUrl = 'http://phdcomics.com/'
url = baseUrl + 'comics.php'
stripUrl = baseUrl + 'comics/archive.php?comicid=%s'
firstStripUrl = stripUrl % '1'
imageSearch = compile(tagre("img", "src", r'(http://www\.phdcomics\.com/comics/archive/phd[^ ]+)', quote=""))
prevSearch = compile(tagre("a", "href", r'((?:comics/)?archive\.php\?comicid=\d+)', quote="") +
@ -167,9 +167,9 @@ class _PlanescapeSurvival(_BasicScraper):
class PokeyThePenguin(_BasicScraper):
baseurl = 'http://www.yellow5.com/pokey/archive/'
url = baseurl + 'index558.html'
stripUrl = baseurl + 'index%s.html'
baseUrl = 'http://www.yellow5.com/pokey/archive/'
url = baseUrl + 'index558.html'
stripUrl = baseUrl + 'index%s.html'
firstStripUrl = stripUrl % '1'
imageSearch = compile(tagre("img", "src", r'(pokey\d+[^"]+)'))
prevSearch = True

View file

@ -17,9 +17,9 @@ class QuestionableContent(_BasicScraper):
class Qwantz(_BasicScraper):
baseurl = 'http://www.qwantz.com/'
url = baseurl + 'index.php'
rurl = escape(baseurl)
baseUrl = 'http://www.qwantz.com/'
url = baseUrl + 'index.php'
rurl = escape(baseUrl)
stripUrl = url + '?comic=%s'
firstStripUrl = stripUrl % '1'
imageSearch = compile(tagre("img", "src", r'(%scomics/[^"]+)' % rurl))

View file

@ -35,10 +35,10 @@ class RealmOfAtland(_BasicScraper):
class RedMeat(_BasicScraper):
baseurl = 'http://www.redmeat.com/redmeat/'
url = baseurl + 'current/index.html'
baseUrl = 'http://www.redmeat.com/redmeat/'
url = baseUrl + 'current/index.html'
starter = bounceStarter(url, compile(r'<a href="(\.\./\d{4}-\d{2}-\d{2}/index\.html)">next</a>'))
stripUrl = baseurl + '%s/index.html'
stripUrl = baseUrl + '%s/index.html'
firstStripUrl = stripUrl % '1996-06-10'
imageSearch = compile(r'<img src="(index-1\.gif)" width="\d+" height="\d+" [^>]*>')
prevSearch = compile(r'<a href="(\.\./\d{4}-\d{2}-\d{2}/index\.html)">previous</a>')

View file

@ -316,9 +316,9 @@ class SodiumEyes(_BasicScraper):
class Sorcery101(_BasicScraper):
description = u'Welcome to the site of Kel McDonald, professional comic illustrator and writer.'
baseurl = 'http://www.sorcery101.net/'
url = baseurl + 'sorcery-101/'
rurl = escape(baseurl)
baseUrl = 'http://www.sorcery101.net/'
url = baseUrl + 'sorcery-101/'
rurl = escape(baseUrl)
stripUrl = url + '%s/'
imageSearch = compile(tagre("img", "src", r'(%swp-content/uploads/\d+/\d+/[^"]+)' % rurl))
prevSearch = compile(tagre("a", "href", r'(%ssorcery-101/[^"]+)' % rurl, after="previous-"))
@ -475,10 +475,10 @@ class SomethingPositive(_BasicScraper):
class StarCrossdDestiny(_BasicScraper):
description = u'Furturistic fantasy. A group of outcasts fight to survive in a world that shuns them as freaks.'
baseurl = 'http://www.starcrossd.net/'
rurl = escape(baseurl)
url = baseurl + 'comic.html'
stripUrl = baseurl + 'archives/%s.html'
baseUrl = 'http://www.starcrossd.net/'
rurl = escape(baseUrl)
url = baseUrl + 'comic.html'
stripUrl = baseUrl + 'archives/%s.html'
firstStripUrl = stripUrl % '00000001'
imageSearch = compile(tagre("img", "src", r'(%s(?:ch1|strips|book2)/[^"]+)' % rurl))
prevSearch = compile(r'<a href="(%s(?:ch1/)?archives/\d+\.html)"[^>]*"[^"]*"[^>]*>prev' % rurl, IGNORECASE)

View file

@ -37,14 +37,14 @@ class TheNoob(_BasicScraper):
class TheOrderOfTheStick(_BasicScraper):
baseurl = 'http://www.giantitp.com/'
url = baseurl + 'comics/oots0863.html'
stripUrl = baseurl + 'comics/oots%s.html'
baseUrl = 'http://www.giantitp.com/'
url = baseUrl + 'comics/oots0863.html'
stripUrl = baseUrl + 'comics/oots%s.html'
firstStripUrl = stripUrl % '0001'
imageSearch = compile(r'<IMG src="(/comics/images/[^"]+)">')
prevSearch = compile(r'<A href="(/comics/oots\d{4}\.html)"><IMG src="/Images/redesign/ComicNav_Back.gif"')
help = 'Index format: n (unpadded)'
starter = indirectStarter(baseurl, compile(r'<A href="(/comics/oots\d{4}\.html)"'))
starter = indirectStarter(baseUrl, compile(r'<A href="(/comics/oots\d{4}\.html)"'))
@classmethod
def namer(cls, imageUrl, pageUrl):
@ -52,9 +52,9 @@ class TheOrderOfTheStick(_BasicScraper):
class TheParkingLotIsFull(_BasicScraper):
baseurl = 'http://plif.courageunfettered.com/'
url = baseurl + 'archive/arch2002.htm'
stripUrl = baseurl + 'archive/arch%s.htm'
baseUrl = 'http://plif.courageunfettered.com/'
url = baseUrl + 'archive/arch2002.htm'
stripUrl = baseUrl + 'archive/arch%s.htm'
firstStripUrl = stripUrl % '1998'
imageSearch = compile(r'<td align="center"><A TARGET=_parent HREF="(wc\d+\..+?)">')
multipleImagesPerStrip = True
@ -147,9 +147,9 @@ class TheWhiteboard(_BasicScraper):
class HMHigh(_BasicScraper):
name = 'TheFallenAngel/HMHigh'
baseurl = 'http://www.thefallenangel.co.uk/'
url = baseurl + 'hmhigh/'
rurl = escape(baseurl)
baseUrl = 'http://www.thefallenangel.co.uk/'
url = baseUrl + 'hmhigh/'
rurl = escape(baseUrl)
stripUrl = url + '?id=%s'
imageSearch = compile(r'<img src="(%shmhigh/img/comic/.+?)"' % rurl)
prevSearch = compile(r' <a href="(%s.+?)" title=".+?">Prev</a>' % rurl)

View file

@ -20,9 +20,9 @@ class Undertow(_BasicScraper):
class UnicornJelly(_BasicScraper):
baseurl = 'http://unicornjelly.com/'
url = baseurl + 'uni666.html'
stripUrl = baseurl + 'uni%s.html'
baseUrl = 'http://unicornjelly.com/'
url = baseUrl + 'uni666.html'
stripUrl = baseUrl + 'uni%s.html'
firstStripUrl = stripUrl % '001'
imageSearch = compile(r'</TABLE>(?:<FONT COLOR="BLACK">)?<IMG SRC="(images/[^"]+)" WIDTH=')
prevSearch = compile(r'<A HREF="(uni\d{3}[bcs]?\.html)">(<FONT COLOR="BLACK">)?<IMG SRC="images/back00\.gif"')

View file

@ -75,18 +75,18 @@ class WeCanSleepTomorrow(_BasicScraper):
class WhiteNinja(_BasicScraper):
baseurl = 'http://www.whiteninjacomics.com/'
url = baseurl + 'comics.shtml'
stripUrl = baseurl + 'comics/%s.shtml'
baseUrl = 'http://www.whiteninjacomics.com/'
url = baseUrl + 'comics.shtml'
stripUrl = baseUrl + 'comics/%s.shtml'
imageSearch = compile(r'<img src=(/images/comics/(?!t-).+?\.gif) border=0')
prevSearch = compile(r'(/comics/.+?shtml).+?previous')
help = 'Index format: s (comic name)'
class WhiteNoise(_BasicScraper):
baseurl = 'http://www.wncomic.com/'
url = baseurl + 'archive.php'
stripUrl = baseurl + 'archive_comments.php?strip_id=%s'
baseUrl = 'http://www.wncomic.com/'
url = baseUrl + 'archive.php'
stripUrl = baseUrl + 'archive_comments.php?strip_id=%s'
firstStripUrl = stripUrl % '1'
imageSearch = compile(r'(istrip_files/strips/.+?)"')
prevSearch = compile(r'</a><a href="(.+?)"><img src="images/top_back.jpg" ')
@ -94,10 +94,10 @@ class WhiteNoise(_BasicScraper):
class WhyTheLongFace(_BasicScraper):
baseurl = 'http://www.absurdnotions.org/'
rurl = escape(baseurl)
url = baseurl + 'wtlf200709.html'
stripUrl = baseurl + 'wtlf%s.html'
baseUrl = 'http://www.absurdnotions.org/'
rurl = escape(baseUrl)
url = baseUrl + 'wtlf200709.html'
stripUrl = baseUrl + 'wtlf%s.html'
firstStripUrl = stripUrl % '200306'
imageSearch = compile(r'<img src="(%swtlf.+?|lf\d+.\w{1,4})"' % rurl, IGNORECASE)
multipleImagesPerStrip = True
@ -134,26 +134,26 @@ class Wondermark(_BasicScraper):
class WorldOfMrToast(_BasicScraper):
baseurl = 'http://www.theimaginaryworld.com/'
url = baseurl + 'mrTcomicA.html'
stripUrl = baseurl + '%s.html'
baseUrl = 'http://www.theimaginaryworld.com/'
url = baseUrl + 'mrTcomicA.html'
stripUrl = baseUrl + '%s.html'
imageSearch = compile(tagre("img", "src", r'(comic[^"]+)'))
# list the archive links since there is no prev/next navigation
prevurls = (
url,
baseurl + 'mrTcomicW02.html',
baseurl + 'mrTcomicW01.html',
baseurl + 'mrGcomic03.html',
baseurl + 'mrGcomic02.html',
baseurl + 'mrGcomic01.html',
baseurl + 'mrTcomicT05.html',
baseurl + 'mrTcomicT04.html',
baseurl + 'mrTcomicT03.html',
baseurl + 'mrTcomicT02.html',
baseurl + 'mrTcomicT01.html',
baseurl + 'mrTcomicIW3.html',
baseurl + 'mrTcomicIW2.html',
baseurl + 'mrTcomicIW1.html',
baseUrl + 'mrTcomicW02.html',
baseUrl + 'mrTcomicW01.html',
baseUrl + 'mrGcomic03.html',
baseUrl + 'mrGcomic02.html',
baseUrl + 'mrGcomic01.html',
baseUrl + 'mrTcomicT05.html',
baseUrl + 'mrTcomicT04.html',
baseUrl + 'mrTcomicT03.html',
baseUrl + 'mrTcomicT02.html',
baseUrl + 'mrTcomicT01.html',
baseUrl + 'mrTcomicIW3.html',
baseUrl + 'mrTcomicIW2.html',
baseUrl + 'mrTcomicIW1.html',
)
firstStripUrl = prevurls[-1]
multipleImagesPerStrip = True