2012-06-20 20:41:04 +00:00
|
|
|
# -*- coding: iso-8859-1 -*-
|
|
|
|
# Copyright (C) 2004-2005 Tristan Seligmann and Jonathan Jacobs
|
2012-06-20 19:58:13 +00:00
|
|
|
from re import compile
|
|
|
|
|
2012-10-11 10:03:12 +00:00
|
|
|
from ..scraper import _BasicScraper
|
2012-11-13 05:51:54 +00:00
|
|
|
from ..helpers import constStarter, bounceStarter
|
2012-10-11 10:03:12 +00:00
|
|
|
from ..util import tagre, getQueryParams
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
|
|
|
|
class CalvinAndHobbes(_BasicScraper):
    """Scraper settings for Calvin and Hobbes as served by www.gocomics.com."""

    # bounceStarter receives the front page URL and a pattern for the
    # "Next feature" link found on a strip page.
    # All patterns are raw strings so that \d and \. reach the regex engine
    # unchanged instead of being (invalid) string escape sequences.
    starter = bounceStarter(
        'http://www.gocomics.com/calvinandhobbes/',
        compile(tagre("a", "href", r"(/calvinandhobbes/\d+/\d+/\d+)") +
                "Next feature</a>"))
    stripUrl = 'http://www.gocomics.com/calvinandhobbes/%s'
    imageSearch = compile(
        tagre("img", "src", r"(http://assets\.amuniversal\.com/[a-f0-9]+)"))
    prevSearch = compile(
        tagre("a", "href", r"(/calvinandhobbes/\d+/\d+/\d+)") +
        "Previous feature</a>")
    help = 'Index format: yyyy/mm/dd'

    @classmethod
    def namer(cls, imageUrl, pageUrl):
        """Return '<year><month><day>.gif' from the last three path parts of pageUrl.

        imageUrl is not used. Raises ValueError when pageUrl contains fewer
        than three '/' separators.
        """
        _prefix, year, month, day = pageUrl.rsplit('/', 3)
        return "%s%s%s.gif" % (year, month, day)
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
|
|
|
|
class CandyCartoon(_BasicScraper):
    """Scraper settings for the comic served from http://www.candycartoon.com/."""

    latestUrl = 'http://www.candycartoon.com/'
    # Strip pages live below the front page under archives/<index>.html
    stripUrl = latestUrl + 'archives/%s.html'
    imageSearch = compile(
        r'<img alt="[^"]*" '
        r'src="(http://www\.candycartoon\.com/archives/[^"]+)"')
    prevSearch = compile(
        r'<a href="(http://www\.candycartoon\.com/archives/\d{6}\.html)">prev')
    help = 'Index format: nnnnnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CaptainSNES(_BasicScraper):
    """Scraper settings for the comic served from http://captainsnes.com/."""

    latestUrl = 'http://captainsnes.com/'
    stripUrl = 'http://captainsnes.com/?date=%s'
    # Dots in the host name are escaped so they only match a literal '.'.
    imageSearch = compile(r"<img src='(http://www\.captainsnes\.com/comics/.+?)'")
    # The captured group is the part of the link after the host name.
    prevSearch = compile(r'<a href="http://www\.captainsnes\.com/(.+?)"><span class="prev">')
    help = 'Index format: yyyymmdd'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CaribbeanBlue(_BasicScraper):
    """Scraper settings for the comic served from http://cblue.katbox.net/."""

    latestUrl = 'http://cblue.katbox.net/'
    stripUrl = 'http://cblue.katbox.net/index.php?strip_id=%s'
    imageSearch = compile(r'="(.+?strips/.+?)"')
    # The dot of the image file name is escaped so it matches only a literal '.'.
    prevSearch = compile(r'<a href="(.+?)"><img src="images/navigation_back\.png"')
    help = 'Index format: n (unpadded)'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Catena(_BasicScraper):
    """Scraper settings for the comic served from http://catenamanor.com/."""

    latestUrl = 'http://catenamanor.com/'
    stripUrl = 'http://catenamanor.com/%s'
    imageSearch = compile(
        tagre("img", "src", r'(http://catenamanor\.com/comics/[^"]+)'))
    # Previous link: an anchor tag carrying rel="prev" after its href.
    prevSearch = compile(
        tagre("a", "href", r'([^"]+)', after='rel="prev"'))
    help = 'Index format: yyyy/mm/dd/<name>'
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
|
|
|
|
class Catharsis(_BasicScraper):
    """Scraper settings for the comic served from http://catharsiscomic.com/."""

    latestUrl = 'http://catharsiscomic.com/'
    # Strip pages are addressed through archive.php on the same host.
    stripUrl = latestUrl + 'archive.php?strip=%s'
    imageSearch = compile(r'<img src="(strips/.+?)"')
    prevSearch = compile(r'<a href="(.+?)".+"Previous')
    help = 'Index format: yymmdd-<your guess>.html'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class ChasingTheSunset(_BasicScraper):
    """Scraper settings for the comic served from http://www.fantasycomic.com/."""

    latestUrl = 'http://www.fantasycomic.com/'
    stripUrl = 'http://www.fantasycomic.com/index.php?p=c%s'
    imageSearch = compile(r'(/cmsimg/.+?)".+?comic-img')
    # Group 1 is the link target, group 2 the navigation image that matched.
    # The dots of the image file names are escaped to match a literal '.'.
    prevSearch = compile(r'<a href="(.+?)" title="" ><img src="(images/eye-prev\.png|images/cn-prev\.png)"')
    help = 'Index format: n'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Chisuji(_BasicScraper):
    """Scraper settings for the comic served from http://www.chisuji.com/."""

    latestUrl = 'http://www.chisuji.com/'
    stripUrl = 'http://www.chisuji.com/%s'
    # Dots in the host name are escaped so they only match a literal '.'.
    imageSearch = compile(r'<img src="(http://www\.chisuji\.com/comics/.+?)"')
    prevSearch = compile(r'<div class="nav-previous"><a href="(http://www\.chisuji\.com/.+?)">')
    help = 'Index format: yyyy/mm/dd/strip-name'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class ChugworthAcademy(_BasicScraper):
    """Scraper settings for the comic served from http://chugworth.com/."""

    latestUrl = 'http://chugworth.com/'
    stripUrl = 'http://chugworth.com/?p=%s'
    imageSearch = compile(r'<img src="(.+?)" alt="Comic')
    # The dot in the host name is escaped so it only matches a literal '.'.
    prevSearch = compile(r'<a href="(http://chugworth\.com/\?p=\d{1,4})"[^>]+?title="Previous">')
    help = 'Index format: n (unpadded)'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class ChugworthAcademyArchive(_BasicScraper):
    """Scraper settings for the archive pages below http://chugworth.com/archive/."""

    # The start page is pinned to a fixed strip id.
    latestUrl = 'http://chugworth.com/archive/?strip_id=422'
    stripUrl = 'http://chugworth.com/archive/?strip_id=%s'
    # NOTE(review): the '.' before \w{1,4} is unescaped and may have been
    # meant as a literal dot; left unchanged - confirm before tightening.
    imageSearch = compile(r'<img src=(comics/\d+.+?.\w{1,4})')
    # The dot of "previous.gif" is escaped so it only matches a literal '.'.
    prevSearch = compile(r"<a href='(.+?)'><img src='images/previous\.gif")
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CigarroAndCerveja(_BasicScraper):
    """Scraper settings for the comic served from http://www.cigarro.ca/."""

    latestUrl = 'http://www.cigarro.ca/'
    # Strip pages use the ?p=<index> query on the front page URL.
    stripUrl = latestUrl + '?p=%s'
    imageSearch = compile(r"(/comics/.+?)'")
    prevSearch = compile(r'(/\?p=.+?)">&laq')
    help = 'Index format: non'
|
|
|
|
|
|
|
|
|
2012-11-14 19:23:30 +00:00
|
|
|
# XXX move: TinyKittenTeeth does not start with "C" like the other scrapers here
|
|
|
|
class TinyKittenTeeth(_BasicScraper):
    """Scraper settings for the comic served from http://www.tinykittenteeth.com/."""

    latestUrl = 'http://www.tinykittenteeth.com/'
    stripUrl = 'http://www.tinykittenteeth.com/index.php?current=%s'
    imageSearch = compile(
        tagre("img", "src", r'(http://www\.tinykittenteeth\.com/comics/[^"]+)'))
    # Previous link: an anchor tag with "Previous" after its href attribute.
    prevSearch = compile(
        tagre("a", "href", r'([^"]+)', after="Previous"))
    help = 'Index format: n (unpadded)'
|
|
|
|
|
|
|
|
|
|
|
|
class Comedity(_BasicScraper):
    """Scraper settings for the comic served from http://www.comedity.com/."""

    latestUrl = 'http://www.comedity.com/'
    stripUrl = 'http://www.comedity.com/index.php?strip_id=%s'
    imageSearch = compile(r'<img src="(Comedity_files/.+?)"')
    # The dot of "index.php" is escaped so it only matches a literal '.'.
    prevSearch = compile(r'<a href="(/?index\.php\?strip_id=\d+?)"> *<img alt="Prior Strip')
    help = 'Index format: n (no padding)'
|
|
|
|
|
|
|
|
|
|
|
|
class Commissioned(_BasicScraper):
    """Scraper settings for the comic served from http://www.commissionedcomic.com/."""

    latestUrl = 'http://www.commissionedcomic.com/'
    stripUrl = 'http://www.commissionedcomic.com/index.php?strip=%s'
    # Dots in the host name are escaped so they only match a literal '.'.
    imageSearch = compile(r'<img src="(http://www\.commissionedcomic\.com/comics/.+?)"')
    # NOTE(review): the link text below is a non-ASCII character that is not
    # part of the iso-8859-1 encoding declared for this file - verify that the
    # literal matches what the site actually sends.
    prevSearch = compile(r'<a href="(.+?)">‹</a>')
    help = 'Index format: n'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CoolCatStudio(_BasicScraper):
    """Scraper settings for the comic served from http://www.coolcatstudio.com/."""

    latestUrl = 'http://www.coolcatstudio.com/'
    stripUrl = 'http://www.coolcatstudio.com/strips-cat/ccs%s'
    # Host name dots are escaped here as well, consistent with prevSearch.
    imageSearch = compile(
        tagre("img", "src", r'(http://www\.coolcatstudio\.com/comics/[^"]+)'))
    # Previous link: an anchor tag with "cniprevt" before its href attribute.
    prevSearch = compile(
        tagre("a", "href", r'(http://www\.coolcatstudio\.com/strips-cat/[^"]+)',
              before="cniprevt"))
    help = 'Index format: yyyymmdd'
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CourtingDisaster(_BasicScraper):
    """Scraper settings for the comic served from http://www.courting-disaster.com/."""

    latestUrl = 'http://www.courting-disaster.com/'
    stripUrl = 'http://www.courting-disaster.com/archive/%s.html'
    imageSearch = compile(r'(/comics/.+?)"')
    # The dot of "previous.gif" is escaped so it only matches a literal '.'.
    prevSearch = compile(r'</a><a href="(.+?)"><img src="/images/previous\.gif"[^>]+?>')
    help = 'Index format: yyyymmdd'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CrapIDrewOnMyLunchBreak(_BasicScraper):
    """Scraper settings for the comic served from http://crap.jinwicked.com/."""

    latestUrl = 'http://crap.jinwicked.com/'
    stripUrl = 'http://crap.jinwicked.com/%s'
    imageSearch = compile(
        tagre("img", "src", r'(http://crap\.jinwicked\.com/comics/[^"]+)'))
    # Previous link: an anchor tag with "prev" after its href attribute.
    prevSearch = compile(
        tagre("a", "href", r'([^"]+)', after="prev"))
    help = 'Index format: yyyy/mm/dd/name'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CtrlAltDel(_BasicScraper):
    """Scraper settings for the comic served from http://www.cad-comic.com/cad/."""

    latestUrl = 'http://www.cad-comic.com/cad/'
    stripUrl = 'http://www.cad-comic.com/cad/%s'
    # Image paths contain a section name followed by an eight-digit number.
    imageSearch = compile(r'<img src="(/comics/\w+/\d{8}\..+?)"')
    prevSearch = compile(r'<a href="(/\w+/\d{8})" class="nav-back')
    help = 'Index format: yyyymmdd'
|
|
|
|
|
|
|
|
|
|
|
|
class CtrlAltDelSillies(CtrlAltDel):
    """CtrlAltDel variant for http://www.cad-comic.com/sillies/.

    Only the name and the URLs are overridden; everything else is
    inherited from CtrlAltDel.
    """

    name = 'CtrlAltDel/Sillies'
    latestUrl = 'http://www.cad-comic.com/sillies/'
    stripUrl = 'http://www.cad-comic.com/sillies/%s'
|
|
|
|
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
class Curvy(_BasicScraper):
    """Scraper settings for the comic served from http://www.c.urvy.org/."""

    latestUrl = 'http://www.c.urvy.org/'
    # Strip pages use the ?date=<index> query on the front page URL.
    stripUrl = latestUrl + '?date=%s'
    imageSearch = compile(r'(/c/.+?)"')
    prevSearch = compile(r'(/\?date=.+?)"><< Previous page')
    help = 'Index format: yyyymmdd'
|
|
|
|
|
|
|
|
|
|
|
|
def cloneManga(name, shortName, lastStrip=None):
    """Build a scraper class for a comic hosted on manga.clone-army.org.

    name is used for the class name ('CloneManga_<name>') and the scraper
    name ('CloneManga/<name>'); shortName selects the '<shortName>.php'
    page on the site.  When lastStrip is given the starter is a
    constStarter for that page number, otherwise a bounceStarter built from
    the base URL and a pattern for the link wrapping "next.gif".
    """
    url = 'http://manga.clone-army.org'
    baseUrl = '%s/%s.php' % (url, shortName)
    stripUrl = baseUrl + '?page=%s'

    if lastStrip is not None:
        starter = constStarter(stripUrl % lastStrip)
    else:
        nextLink = tagre("a", "href", r'([^"]+)') + tagre("img", "src", r"next\.gif")
        starter = bounceStarter(baseUrl, compile(nextLink))

    def namer(self, imageUrl, pageUrl):
        # The file name is the "page" query parameter, zero-padded to 3 digits.
        pageNumber = getQueryParams(pageUrl)['page'][0]
        return '%03d' % int(pageNumber)

    # The image source may be given with or without the site prefix.
    imagePattern = r'((?:%s/)?%s/[^"]+)' % (url, shortName)
    prevLink = tagre("a", "href", r'([^"]+)') + tagre("img", "src", r"previous\.gif")
    attrs = {
        'name': 'CloneManga/' + name,
        'starter': starter,
        'stripUrl': stripUrl,
        'imageSearch': compile(tagre("img", "src", imagePattern, after="center")),
        'prevSearch': compile(prevLink),
        'help': 'Index format: n',
        'namer': namer,
    }
    return type('CloneManga_%s' % name, (_BasicScraper,), attrs)
|
|
|
|
|
|
|
|
|
|
|
|
# Scraper classes for the individual clone-army comics.  Those created
# with a third argument start from that fixed page number.
anm = cloneManga("AprilAndMay", "anm")
kanami = cloneManga("Kanami", "kanami")
momoka = cloneManga("MomokaCorner", "momoka")
nana = cloneManga("NanasEverydayLife", "nana", "78")
pxi = cloneManga("PaperEleven", "pxi", "311")
t42r = cloneManga("Tomoyo42sRoom", "t42r")
penny = cloneManga("PennyTribute", "penny")
|
|
|
|
|
|
|
|
|
|
|
|
class CatAndGirl(_BasicScraper):
    """Scraper settings for the comic served from http://catandgirl.com/."""

    latestUrl = 'http://catandgirl.com/'
    # Strip pages use the ?p=<index> query on the front page URL.
    stripUrl = latestUrl + '?p=%s'
    imageSearch = compile(
        tagre("img", "src", r'(http://catandgirl\.com/archive/[^"]+)'))
    # Previous link: an anchor whose text ends with "Previous".
    prevSearch = compile(
        tagre("a", "href", r'([^"]+)') + r"[^<]+Previous</a>")
    help = 'Index format: n (unpadded)'
|
|
|
|
|
|
|
|
|
|
|
|
def comicsDotCom(name, section):
    """Build a scraper class for the comic ``name`` on www.gocomics.com.

    name is used in the class name ('GoComicsDotCom_<name>'), the scraper
    name ('GoComicsDotCom/<name>'), the URLs and the image file names.
    section is accepted for compatibility with existing callers and is not
    used.
    """
    latestUrl = 'http://www.gocomics.com/%s' % name

    @classmethod
    def namer(cls, imageUrl, pageUrl):
        # Strip pages end in .../yyyy/mm/dd, so the date has to be taken
        # from the right-hand side of the URL (splitting from the left
        # would cut the scheme and host apart instead).
        _prefix, year, month, day = pageUrl.rsplit('/', 3)
        return "%s_%s%s%s.gif" % (name, year, month, day)

    # NOTE(review): unlike the other scrapers in this file, the generated
    # class gets neither a latestUrl nor a starter attribute - confirm
    # whether _BasicScraper needs one of them.
    attrs = dict(
        name='GoComicsDotCom/' + name,
        stripUrl=latestUrl + '/%s',
        imageSearch=compile(
            tagre("img", "src", r'(http://assets\.amuniversal\.com/[0-9a-f]+)')),
        # The comic name must be substituted into the link pattern; the
        # pattern is a raw string so \d reaches the regex engine unchanged.
        prevSearch=compile(
            tagre("a", "href", r"(/%s/\d+/\d+/\d+)" % name) + "Previous"),
        help='Index format: yyyy/mm/dd',
        namer=namer,
    )
    return type('GoComicsDotCom_%s' % name, (_BasicScraper,), attrs)
|
|
|
|
|
2012-10-12 19:47:57 +00:00
|
|
|
# http://www.gocomics.com/features
|
|
|
|
# XXX
|
|
|
|
|
|
|
|
# http://www.gocomics.com/explore/editorial_list
|
|
|
|
# XXX
|
|
|
|
|
|
|
|
# http://www.gocomics.com/explore/sherpa_list
|
|
|
|
# XXX
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
# One generated scraper class per comic; the second argument is the
# section name handed to comicsDotCom.
acaseinpoint = comicsDotCom("acaseinpoint", "comics")
agnes = comicsDotCom("agnes", "creators")
alleyoop = comicsDotCom("alleyoop", "comics")
andycapp = comicsDotCom("andycapp", "creators")
arlonjanis = comicsDotCom("arlonjanis", "comics")
ballardst = comicsDotCom("ballardst", "creators")
barkeaterlake = comicsDotCom("barkeaterlake", "comics")
bc = comicsDotCom("bc", "creators")
ben = comicsDotCom("ben", "comics")
betty = comicsDotCom("betty", "comics")
bignate = comicsDotCom("bignate", "comics")
bonanas = comicsDotCom("bonanas", "wash")
bornloser = comicsDotCom("bornloser", "comics")
buckets = comicsDotCom("buckets", "comics")
candorville = comicsDotCom("candorville", "wash")
cheapthrills = comicsDotCom("cheapthrills", "wash")
chickweed = comicsDotCom("chickweed", "comics")
committed = comicsDotCom("committed", "comics")
dilbert = comicsDotCom("dilbert", "comics")
drabble = comicsDotCom("drabble", "comics")
fatcats = comicsDotCom("fatcats", "comics")
ferdnand = comicsDotCom("ferdnand", "comics")
flightdeck = comicsDotCom("flightdeck", "creators")
floandfriends = comicsDotCom("floandfriends", "creators")
franknernest = comicsDotCom("franknernest", "comics")
frazz = comicsDotCom("frazz", "comics")
geech = comicsDotCom("geech", "comics")
genepool = comicsDotCom("genepool", "wash")
getfuzzy = comicsDotCom("getfuzzy", "comics")
gofish = comicsDotCom("gofish", "comics")
graffiti = comicsDotCom("graffiti", "comics")
grandave = comicsDotCom("grandave", "comics")
grizzwells = comicsDotCom("grizzwells", "comics")
heathcliff = comicsDotCom("heathcliff", "creators")
hedge = comicsDotCom("hedge", "comics")
herbnjamaal = comicsDotCom("herbnjamaal", "creators")
herman = comicsDotCom("herman", "comics")
humblestumble = comicsDotCom("humblestumble", "comics")
janesworld = comicsDotCom("janesworld", "comics")
jumpstart = comicsDotCom("jumpstart", "comics")
kitncarlyle = comicsDotCom("kitncarlyle", "comics")
liberty = comicsDotCom("liberty", "creators")
lilabner = comicsDotCom("lilabner", "comics")
luann = comicsDotCom("luann", "comics")
marmaduke = comicsDotCom("marmaduke", "comics")
meg = comicsDotCom("meg", "comics")
moderatelyconfused = comicsDotCom("moderatelyconfused", "comics")
momma = comicsDotCom("momma", "creators")
monty = comicsDotCom("monty", "comics")
motley = comicsDotCom("motley", "comics")
nancy = comicsDotCom("nancy", "comics")
naturalselection = comicsDotCom("naturalselection", "creators")
offthemark = comicsDotCom("offthemark", "comics")
onebighappy = comicsDotCom("onebighappy", "creators")
othercoast = comicsDotCom("othercoast", "creators")
pcnpixel = comicsDotCom("pcnpixel", "wash")
peanuts = comicsDotCom("peanuts", "comics")
pearls = comicsDotCom("pearls", "comics")
pibgorn = comicsDotCom("pibgorn", "comics")
pickles = comicsDotCom("pickles", "wash")
raisingduncan = comicsDotCom("raisingduncan", "comics")
reality = comicsDotCom("reality", "comics")
redandrover = comicsDotCom("redandrover", "wash")
ripleys = comicsDotCom("ripleys", "comics")
roseisrose = comicsDotCom("roseisrose", "comics")
rubes = comicsDotCom("rubes", "creators")
rudypark = comicsDotCom("rudypark", "comics")
shirleynson = comicsDotCom("shirleynson", "comics")
soup2nutz = comicsDotCom("soup2nutz", "comics")
speedbump = comicsDotCom("speedbump", "creators")
spotthefrog = comicsDotCom("spotthefrog", "comics")
strangebrew = comicsDotCom("strangebrew", "creators")
sunshineclub = comicsDotCom("sunshineclub", "comics")
tarzan = comicsDotCom("tarzan", "comics")
thatslife = comicsDotCom("thatslife", "wash")
wizardofid = comicsDotCom("wizardofid", "creators")
workingdaze = comicsDotCom("workingdaze", "comics")
workingitout = comicsDotCom("workingitout", "creators")
|
|
|
|
|
|
|
|
|
|
|
|
def creators(name, shortname):
    """Build a scraper class for a comic hosted on www.creators.com.

    name is used in the class name ('Creators_<name>') and the scraper
    name ('Creators/<name>'); shortname is inserted as the ComicName query
    parameter of latestUrl.  stripUrl is None and the help text states
    that indexing is unsupported.
    """
    attrs = {
        'name': 'Creators/' + name,
        'latestUrl': 'http://www.creators.com/comics_show.cfm?ComicName=%s' % (shortname,),
        'stripUrl': None,
        'imageSearch': compile(r'<img alt="[^"]+" src="(\d{4}/.+?/.+?\..+?)">'),
        'prevSearch': compile(
            r'<a href="(comics_show\.cfm\?next=\d+&ComicName=.+?)" '
            r'Title="Previous Comic"'),
        'help': 'Indexing unsupported',
    }
    return type('Creators_%s' % name, (_BasicScraper,), attrs)
|
|
|
|
|
|
|
|
|
|
|
|
# One generated scraper class per creators.com comic; the second argument
# is the short name used in the ComicName query parameter.
arc = creators("Archie", "arc")
shg = creators("AskShagg", "shg")
hev = creators("ForHeavensSake", "hev")
rug = creators("Rugrats", "rug")
sou = creators("StateOfTheUnion", "sou")
din = creators("TheDinetteSet", "din")
lil = creators("TheMeaningOfLila", "lil")
wee = creators("WeePals", "wee")
zhi = creators("ZackHill", "zhi")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CyanideAndHappiness(_BasicScraper):
    """Scraper settings for the comic served from http://www.explosm.net/comics."""

    latestUrl = 'http://www.explosm.net/comics'
    # Strip pages are sub-paths of the latest-comic URL.
    stripUrl = latestUrl + '/%s'
    imageSearch = compile(
        r'<img alt="Cyanide and Happiness, a daily webcomic" '
        r'src="(http:\/\/www\.explosm\.net/db/files/Comics/\w+/\S+\.\w+)"')
    prevSearch = compile(r'<a href="(/comics/\d+/?)">< Previous</a>')
    help = 'Index format: n (unpadded)'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CrimsonDark(_BasicScraper):
    """Scraper settings for the comic served from http://www.davidcsimon.com/crimsondark/."""

    latestUrl = 'http://www.davidcsimon.com/crimsondark/'
    stripUrl = 'http://www.davidcsimon.com/crimsondark/index.php?view=comic&strip_id=%s'
    imageSearch = compile(r'src="(.+?strips/.+?)"')
    # Attribute values may be quoted with either ' or ".  The dot of
    # "active_prev.png" is escaped like the one in "index.php" so that it
    # only matches a literal '.'.
    prevSearch = compile(r'<a href=[\'"](/crimsondark/index\.php\?view=comic&strip_id=\d+)[\'"]><img src=[\'"]themes/cdtheme/images/active_prev\.png[\'"]')
    help = 'Index format: n (unpadded)'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CrimesOfCybeleCity(_BasicScraper):
    """Scraper settings for the comic served from http://www.pulledpunches.com/crimes/.

    The strip, image and previous-link URLs all point at
    www.beaglespace.com/pulledpunches/crimes/.
    """

    latestUrl = 'http://www.pulledpunches.com/crimes/'
    stripUrl = 'http://www.beaglespace.com/pulledpunches/crimes/?p=%s'
    imageSearch = compile(
        r'<img src="'
        r'(http://www\.beaglespace\.com/pulledpunches/crimes/comics/[^"]+)"')
    prevSearch = compile(
        r'<a href="(http://www\.beaglespace\.com/pulledpunches/crimes/\?p=\d+)">'
        r'<img src="back1\.gif"')
    help = 'Index format: nn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CatsAndCameras(_BasicScraper):
    """Scraper settings for the comic served from http://catsncameras.com/cnc/."""

    latestUrl = 'http://catsncameras.com/cnc/'
    stripUrl = latestUrl + '?p=%s'
    # Dots in the host name are escaped so they only match a literal '.'.
    imageSearch = compile(r'<img src="(http://catsncameras\.com/cnc/comics/.+?)"')
    prevSearch = compile(r'<div class="nav-previous"><a href="(http://catsncameras\.com/cnc/.+?)">')
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CowboyJedi(_BasicScraper):
    """Scraper settings for the comic served from http://www.cowboyjedi.com/."""

    latestUrl = 'http://www.cowboyjedi.com/'
    stripUrl = 'http://www.cowboyjedi.com/%s'
    # Dots in the host name are escaped so they only match a literal '.'.
    imageSearch = compile(r'<img src="(http://www\.cowboyjedi\.com/comics/.+?)"')
    prevSearch = compile(r'<a href="(http://www\.cowboyjedi\.com/.+?)" class="navi navi-prev"')
    help = 'Index format: yyyy/mm/dd/strip-name'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CasuallyKayla(_BasicScraper):
    """Scraper settings for the comic served from http://casuallykayla.com/."""

    latestUrl = 'http://casuallykayla.com/'
    stripUrl = 'http://casuallykayla.com/?p=%s'
    # The dot in the host name is escaped so it only matches a literal '.'.
    imageSearch = compile(r'<img src="(http://casuallykayla\.com/comics/.+?)"')
    prevSearch = compile(r'<div class="nav-previous"><a href="(.+?)">')
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Collar6(_BasicScraper):
    """Scraper settings for the comic served from http://collar6.com/."""

    latestUrl = 'http://collar6.com/'
    # Strip pages live below the front page under archive/<index>.
    stripUrl = latestUrl + 'archive/%s'
    imageSearch = compile(
        tagre("img", "src",
              r'(http://collar6\.com/wp-content/webcomic/collar6/[^"]+)'))
    # Previous link: an archive anchor with "previous" after its href.
    prevSearch = compile(
        tagre("a", "href", r'(http://collar6\.com/archive/[^"]+)',
              after="previous"))
    help = 'Index format: <name>'
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Chester5000XYV(_BasicScraper):
    """Scraper settings for the comic served from http://jessfink.com/Chester5000XYV/."""

    latestUrl = 'http://jessfink.com/Chester5000XYV/'
    stripUrl = 'http://jessfink.com/Chester5000XYV/?p=%s'
    # The dot in the host name is escaped so it only matches a literal '.'.
    imageSearch = compile(r'<img src="(http://jessfink\.com/Chester5000XYV/comics/.+?)"')
    prevSearch = compile(r'<a href="(.+?)"><span class="prev">')
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CalamitiesOfNature(_BasicScraper):
    """Scraper settings for the comic served from http://www.calamitiesofnature.com/."""

    latestUrl = 'http://www.calamitiesofnature.com/'
    stripUrl = 'http://www.calamitiesofnature.com/archive/?c=%s'
    # The image source is accepted as a relative or an absolute URL.
    # Dots in the host name are escaped so they only match a literal '.'.
    imageSearch = compile(r'<IMG SRC="(archive/\d+.+?|http://www\.calamitiesofnature\.com/archive/\d+.+?)"')
    prevSearch = compile(r'<a id="previous" href="(http://www\.calamitiesofnature\.com/archive/\?c\=\d+)">')
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Champ2010(_BasicScraper):
    """Scraper settings for the comic served from http://www.jedcollins.com/champ2010/.

    The strip, image and previous-link URLs use the host name without
    the "www." prefix.
    """

    latestUrl = 'http://www.jedcollins.com/champ2010/'
    stripUrl = 'http://jedcollins.com/champ2010/?p=%s'
    # Dots in the host name are escaped so they only match a literal '.'.
    imageSearch = compile(r'<img src="(http://jedcollins\.com/champ2010/comics/.+?)"')
    prevSearch = compile(r'<div class="nav-previous"><a href="(http://jedcollins\.com/champ2010/.+?)"')
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Chucklebrain(_BasicScraper):
    """Scraper settings for the comic served from http://www.chucklebrain.com/main.php."""

    latestUrl = 'http://www.chucklebrain.com/main.php'
    stripUrl = 'http://www.chucklebrain.com/main.php?img=%s'
    imageSearch = compile(r'<img src="(/images/strip.+?)"')
    # The dots of "main.php" and "previous.jpg" are escaped so they only
    # match a literal '.'.
    prevSearch = compile(r"<a href='(/main\.php\?img\=\d+)'><img src='/images/previous\.jpg'")
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CompanyY(_BasicScraper):
    """Scraper settings for the comic served from http://company-y.com/."""

    latestUrl = 'http://company-y.com/'
    stripUrl = 'http://company-y.com/%s/'
    # The dot in the host name is escaped so it only matches a literal '.'.
    imageSearch = compile(r'<img src="(http://company-y\.com/comics/.+?)"')
    prevSearch = compile(r'<div class="nav-previous"><a href="(http://company-y\.com/.+?)"')
    help = 'Index format: yyyy/mm/dd/strip-name'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CorydonCafe(_BasicScraper):
    """Scraper settings for the comic served from http://corydoncafe.com/."""

    # bounceStarter receives the front page URL and a pattern for the
    # "Next>" link.  The dot before "html" is escaped in both link patterns
    # so it only matches a literal '.'.
    starter = bounceStarter(
        'http://corydoncafe.com/',
        compile(r' href="(\./comic-\d+\.html)">Next></a>'))
    stripUrl = 'http://corydoncafe.com/comic-%s.html'
    imageSearch = compile(r"<img src='(\./comics/.+?)' ")
    prevSearch = compile(r' href="(\./comic-\d+\.html)"><Previous</a>')
    help = 'Index format: nnn'

    @classmethod
    def namer(cls, imageUrl, pageUrl):
        """Return the last path component of pageUrl up to its first '.'.

        imageUrl is not used.
        """
        return pageUrl.split('/')[-1].split('.')[0]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CraftedFables(_BasicScraper):
    """Scraper settings for the comic served from http://www.craftedfables.com/.

    The strip, image and previous-link URLs all point at
    www.caf-fiends.net/craftedfables/.
    """

    latestUrl = 'http://www.craftedfables.com/'
    stripUrl = 'http://www.caf-fiends.net/craftedfables/?p=%s'
    # Dots in the host name are escaped so they only match a literal '.'.
    imageSearch = compile(r'<img src="(http://www\.caf-fiends\.net/craftedfables/comics/.+?)"')
    prevSearch = compile(r'<a href="(http://www\.caf-fiends\.net/craftedfables/.+?)"><span class="prev">')
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Currhue(_BasicScraper):
    """Scraper settings for the comic served from http://www.currhue.com/."""

    latestUrl = 'http://www.currhue.com/'
    stripUrl = 'http://www.currhue.com/?p=%s'
    # Dots in the host name are escaped so they only match a literal '.'.
    imageSearch = compile(r'<img src="(http://www\.currhue\.com/comics/.+?)"')
    prevSearch = compile(r'<div class="nav-previous"><a href="(http://www\.currhue\.com/.+?)"')
    help = 'Index format: nnn'
|