2012-06-20 20:41:04 +00:00
|
|
|
# -*- coding: iso-8859-1 -*-
|
|
|
|
# Copyright (C) 2004-2005 Tristan Seligmann and Jonathan Jacobs
|
2012-06-20 19:58:13 +00:00
|
|
|
from re import compile
|
|
|
|
|
2012-10-11 19:32:15 +00:00
|
|
|
from ..util import tagre
|
2012-10-11 10:03:12 +00:00
|
|
|
from ..scraper import _BasicScraper
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
|
|
|
|
class BadlyDrawnKitties(_BasicScraper):
    """Scraper definition for badlydrawnkitties.com."""

    latestUrl = 'http://www.badlydrawnkitties.com/'
    stripUrl = 'http://www.badlydrawnkitties.com/new/%s.html'
    # Captures the src of an <img> whose path starts with /new/.
    imageSearch = compile(r'<img src="(/new/.+?)">')
    # An <a href> pattern followed by an <img src> pattern for previous.gif,
    # both built with tagre; the captured group is the site-relative href.
    prevSearch = compile(
        tagre("a", "href", r'(/[^"]+)')
        + tagre("img", "src", r'/images/previous\.gif')
    )
    help = 'Index format: n (unpadded)'
|
|
|
|
|
|
|
|
|
|
|
|
class Bardsworth(_BasicScraper):
    """Scraper definition for bardsworth.com."""

    latestUrl = 'http://www.bardsworth.com/'
    # The placeholder must be '%s'; the previous 's%' left an incomplete
    # format specifier, which makes '%'-formatting raise ValueError.
    stripUrl = 'http://www.bardsworth.com/archive.php?p=%s'
    # Captures a 'strips/...' path up to the closing double quote.
    imageSearch = compile(r'(strips/.+?)"')
    # Captures a quoted http URL that is followed later by '/prev'.
    prevSearch = compile(r'"(http.+?)".+?/prev')
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
class BetterDays(_BasicScraper):
    """Scraper definition for jaynaylor.com/betterdays."""

    latestUrl = 'http://www.jaynaylor.com/betterdays/'
    stripUrl = 'http://www.jaynaylor.com/betterdays/archives/%s'
    # The src attribute is matched unquoted here.
    imageSearch = compile(r'<img src=(/betterdays/comic/.+?)>')
    # Captures the href of the link whose text starts with '« Previous'.
    prevSearch = compile(r'<a href="(.+)">« Previous')
    help = 'Index format: yyyy/mm/<your guess>.html'
|
|
|
|
|
|
|
|
|
|
|
|
class BetterYouThanMe(_BasicScraper):
    """Scraper definition for betteryouthanme.net."""

    latestUrl = 'http://betteryouthanme.net/'
    stripUrl = 'http://betteryouthanme.net/archive.php?date=%s.gif'
    # Captures a double-quoted 'comics/...' path.
    imageSearch = compile(r'"(comics/.+?)"')
    # Captures the archive.php?date=... href that precedes 'previous'.
    prevSearch = compile(r'"(archive.php\?date=.+?)">.+?previous')
    help = 'Index format: yyyymmdd'
|
|
|
|
|
|
|
|
|
|
|
|
class BiggerThanCheeses(_BasicScraper):
    """Scraper definition for biggercheese.com."""

    latestUrl = 'http://www.biggercheese.com'
    stripUrl = 'http://www.biggercheese.com/index.php?comic=%s'
    # Captures a 'comics/...' src that is followed by an alt attribute.
    imageSearch = compile(r'src="(comics/.+?)" alt')
    # Captures the index.php?comic=... link that precedes '_back'.
    prevSearch = compile(r'"(index.php\?comic=.+?)".+?_back')
    help = 'Index format: n (unpadded)'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BizarreUprising(_BasicScraper):
    """Scraper definition for bizarreuprising.com."""

    latestUrl = 'http://www.bizarreuprising.com/'
    stripUrl = 'http://www.bizarreuprising.com/view/%s'
    # Captures the relative 'comic/...' image path.
    imageSearch = compile(r'<img src="(comic/[^"]+)"')
    # Captures the 'view/<number>/<name>' href wrapping the b_prev.gif image.
    prevSearch = compile(
        r'<a href="(view/\d+/[^"]+)"><img src="images/b_prev\.gif"'
    )
    help = 'Index format: n/name'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Blip(_BasicScraper):
    """Scraper definition for blipcomic.com."""

    latestUrl = 'http://blipcomic.com/'
    stripUrl = 'http://blipcomic.com/index.php?strip_id=%s'
    # Captures an 'istrip_files/strips/...' path up to the closing quote.
    imageSearch = compile(r'(istrip_files/strips/.+?)"')
    # Captures the strip_id link found between 'First' and 'prev'.
    prevSearch = compile(r'First.+?"(index.php\?strip_id=.+?)".+?prev')
    help = 'Index format: n'
|
|
|
|
|
|
|
|
|
|
|
|
# NOTE(review): a second class named BlueCrashKit (robhamm.com) is defined
# later in this module and rebinds the module-level name; confirm which
# definition is meant to be active.
class BlueCrashKit(_BasicScraper):
    """Scraper definition for bluecrashkit.com/cheese."""

    latestUrl = 'http://www.bluecrashkit.com/cheese/'
    stripUrl = 'http://www.bluecrashkit.com/cheese/node/%s'
    # Captures a '/cheese/files/comics/...' path up to the closing quote.
    imageSearch = compile(r'(/cheese/files/comics/.+?)"')
    # Captures the '/cheese/node/...' link that precedes 'previous'.
    prevSearch = compile(r'(/cheese/node/.+?)".+?previous')
    help = 'Index format: non'
|
|
|
|
|
|
|
|
|
|
|
|
class BMovieComic(_BasicScraper):
    """Scraper definition for bmoviecomic.com."""

    latestUrl = 'http://www.bmoviecomic.com/'
    stripUrl = 'http://www.bmoviecomic.com/?cid=%s'
    # Captures a double-quoted 'comics/...' path.
    imageSearch = compile(r'"(comics/.+?)"')
    # Captures the '?cid=...' query link that precedes 'Prev'.
    prevSearch = compile(r'(\?cid=.+?)".+?Prev')
    help = 'Index format: n'
|
|
|
|
|
|
|
|
|
|
|
|
# BratHalla has no 'previous' link at comic 360. To get earlier comics you
# will need to start from that strip explicitly:
#   mainline -c BratHalla:360-backup-dad-unstable-plans/
class BratHalla(_BasicScraper):
    """Scraper definition for brat-halla.com."""

    latestUrl = 'http://brat-halla.com/'
    stripUrl = 'http://brat-halla.com/comic/%s'
    # The image link is single-quoted and followed by target='_blank'.
    imageSearch = compile(r"(/comics/.+?)' target='_blank")
    # Captures the first quoted http URL after 'headernav2"'.
    prevSearch = compile(r'headernav2".+?"(http.+?)"')
    help = 'Index format: non'
|
|
|
|
|
|
|
|
|
|
|
|
class Brink(_BasicScraper):
    """Scraper definition for paperfangs.com/brink."""

    latestUrl = 'http://paperfangs.com/brink/'
    stripUrl = 'http://paperfangs.com/brink/?p=%s'
    # Captures 'comics/...' (without the leading slash) up to the quote.
    imageSearch = compile(r'/(comics/.+?)"')
    # Captures the part of the link after '/brink/' that sits between
    # 'previous' and 'Previous'.
    prevSearch = compile(r'previous.+?/brink/(.+?)".+?Previous')
    help = 'Index format: non'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BoredAndEvil(_BasicScraper):
    """Scraper definition for boredandevil.com."""

    latestUrl = 'http://www.boredandevil.com/'
    stripUrl = 'http://www.boredandevil.com/archive.php?date=%s'
    # Captures the relative 'strips/...' image path.
    imageSearch = compile(r'<img src="(strips/.+?)"')
    # Captures an href located between 'First Comic' and 'previous-on.gif'.
    prevSearch = compile(r'First Comic.+<a href="(.+?)".+previous-on.gif')
    help = 'Index format: yyyy-mm-dd'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BoyOnAStickAndSlither(_BasicScraper):
    """Scraper definition for boasas.com."""

    latestUrl = 'http://www.boasas.com/'
    stripUrl = 'http://www.boasas.com/?c=%s'
    # Captures a quoted 'boasas/<digits>.<ext>' path.
    imageSearch = compile(r'"(boasas/\d+\..+?)"')
    # Captures the href wrapping the left_20.png image.
    prevSearch = compile(r'<a href="(.+?)"><img src="images/left_20.png"')
    help = 'Index format: n (unpadded)'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class ButternutSquash(_BasicScraper):
    """Scraper definition for butternutsquash.net."""

    latestUrl = 'http://www.butternutsquash.net/'
    stripUrl = 'http://www.butternutsquash.net/%s'
    # Captures an absolute image URL under /comics/ (pattern built by tagre).
    imageSearch = compile(
        tagre("img", "src", r'(http://www\.butternutsquash\.net/comics/[^"]+)')
    )
    # Captures an absolute site link; tagre is given after="prev".
    prevSearch = compile(
        tagre("a", "href", r'(http://www\.butternutsquash\.net/[^"]+)',
              after="prev")
    )
    help = 'Index format: yyyy/mm/dd/strip-name-author-name'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def blankLabel(name, baseUrl):
    """Create a _BasicScraper subclass for a comic rooted at baseUrl.

    name: comic name; used for the generated class name
        ('BlankLabel_<name>') and its ``name`` attribute
        ('BlankLabel/<name>').
    baseUrl: site root URL. 'd/%s.html' is appended to it directly, so it
        needs to end with '/'.

    Returns the newly created class.
    """
    attrs = dict(
        name='BlankLabel/' + name,
        latestUrl=baseUrl,
        stripUrl=baseUrl + 'd/%s.html',
        # '[s/]' accepts '/comics...' and '/comic/...'. The former '[s|/]'
        # also accepted a literal '|', because '|' is not an alternation
        # operator inside a character class.
        imageSearch=compile(tagre("img", "src", r'(/comic[s/][^"]+)')),
        prevSearch=compile(
            tagre("a", "href", r'[^"]*(/d/\d+\.s?html)')
            + r"[^>]+/images/(?:nav_02|previous_day)\.gif"
        ),
        # Older, broader pattern kept for reference:
        #prevSearch=compile(r'(?:"([^"]*(?:/d/[^"\r\n]*)|(?:/strip/.+?))")(?:(?:.{43}starshift_back.gif)|(?:.+?cxn_previous)|(?:.{43}previous)|(?:[^<>]*>[^<>]*<[^<>]*previous)|(?:.*?back_button)|(?:.*?comicnav-previous))'),
        help='Index format: yyyymmdd',
    )
    return type('BlankLabel_%s' % name, (_BasicScraper,), attrs)
|
|
|
|
|
|
|
|
|
2012-11-14 05:22:08 +00:00
|
|
|
# Scraper classes generated by blankLabel(); each one is bound to a
# module-level name. Disabled entries keep the reason they were switched off.
checkerboard = blankLabel(
    'CheckerboardNightmare', 'http://www.checkerboardnightmare.com/')
courtingDisaster = blankLabel(
    'CourtingDisaster', 'http://www.courting-disaster.com/')
evilInc = blankLabel('EvilInc', 'http://www.evil-comic.com/')
greystoneInn = blankLabel('GreystoneInn', 'http://www.greystoneinn.net/')
itsWalky = blankLabel('ItsWalky', 'http://www.itswalky.com/')
# Disabled: one strip name starts with %20
#krazyLarry = blankLabel('KrazyLarry', 'http://www.krazylarry.com/')
melonpool = blankLabel('Melonpool', 'http://www.melonpool.com/')
# Disabled: strip names = index.php
#realLife = blankLabel('RealLife', 'http://www.reallifecomics.com/')
schlockMercenary = blankLabel(
    'SchlockMercenary', 'http://www.schlockmercenary.com/')
# Disabled: hosted on ComicsDotCom
#sheldon = blankLabel('Sheldon', 'http://www.sheldoncomics.com/')
shortpacked = blankLabel('Shortpacked', 'http://www.shortpacked.com/')
starslipCrisis = blankLabel(
    'StarslipCrisis', 'http://www.starslipcrisis.com/')
uglyHill = blankLabel('UglyHill', 'http://www.uglyhill.com/')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BeePower(_BasicScraper):
    """Scraper definition for Bee Power at comicswithoutviolence.com."""

    latestUrl = 'http://comicswithoutviolence.com/d/20080713.html'
    stripUrl = 'http://comicswithoutviolence.com/d/%s.html'
    # Captures the '/comics/...' image path.
    imageSearch = compile(r'src="(/comics/.+?)"')
    # Captures '<digits>.html' from the link wrapping previous_day.png.
    prevSearch = compile(
        r'(\d+\.html)"><img[^>]+?src="/images/previous_day.png"'
    )
    # Strip pages are 'd/<index>.html' and the latest one is
    # 'd/20080713.html', so the index is a compact date rather than the
    # slash-separated form the help text used to advertise.
    help = 'Index format: yyyymmdd'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BlankIt(_BasicScraper):
    """Scraper definition for blankitcomics.com."""

    latestUrl = 'http://blankitcomics.com/'
    stripUrl = 'http://blankitcomics.com/%s'
    # Captures an absolute image URL under /bicomics/.
    imageSearch = compile(
        r'<img src="(http://blankitcomics.com/bicomics/.+?)"'
    )
    # Captures the href of the link marked rel="prev".
    prevSearch = compile(r'<a href="([^"]+)" rel="prev">')
    help = 'Index format: yyyy/mm/dd/name'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BobWhite(_BasicScraper):
    """Scraper definition for bobwhitecomics.com."""

    latestUrl = 'http://www.bobwhitecomics.com/'
    stripUrl = 'http://www.bobwhitecomics.com/?webcomic_post=%s'
    # Captures an absolute image URL under the webcomic upload directory.
    imageSearch = compile(
        tagre("img", "src",
              r"(http://www\.bobwhitecomics\.com/wp/wp-content/webcomic/untitled/\d+.jpg)")
    )
    # The href pattern is now a raw string: '\.', '\?' and '\d' are invalid
    # escape sequences in a normal string literal. The resulting pattern
    # text is unchanged.
    prevSearch = compile(
        tagre("a", "href",
              r"(http://www\.bobwhitecomics\.com/\?webcomic_post=\d+)")
        + r'[^"]+Previous'
    )
    help = 'Index format: yyyymmdd'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BigFatWhale(_BasicScraper):
    """Scraper definition for bigfatwhale.com."""

    latestUrl = 'http://www.bigfatwhale.com/'
    stripUrl = 'http://www.bigfatwhale.com/archives/bfw_%s.htm'
    # Accepts the image path with or without the 'archives/' prefix.
    imageSearch = compile(r'<img src="(archives/bfw_.+?|bfw_.+?)"')
    # The page markup uses upper-case attribute names for this link.
    prevSearch = compile(
        r' HREF="(.+?)" TARGET="_top" TITLE="Previous Cartoon"'
    )
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BadassMuthas(_BasicScraper):
    """Scraper definition for badassmuthas.com."""

    latestUrl = 'http://badassmuthas.com/pages/comic.php'
    stripUrl = 'http://badassmuthas.com/pages/comic.php?%s'
    # Captures an image path starting with '/images/comicsissue'.
    imageSearch = compile(r'<img src="(/images/comicsissue.+?)"')
    # Captures the href wrapping the comicsbuttonBack.gif image.
    prevSearch = compile(
        r'<a href="(.+?)"><img src="/images/comicsbuttonBack.gif" '
    )
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Boozeathon4Billion(_BasicScraper):
    """Scraper definition for boozeathon4billion.com."""

    latestUrl = 'http://boozeathon4billion.com/'
    stripUrl = 'http://boozeathon4billion.com/comics/%s'
    # Captures an absolute image URL under /comics/.
    imageSearch = compile(
        r'<img src="(http://boozeathon4billion.com/comics/.+?)"'
    )
    # Captures the href of the link whose text is 'Previous'.
    prevSearch = compile(r'<a href="(.+?)"[^>]+?>Previous</a>')
    help = 'Index format: (sometimes chapternumber/)-yyyy-mm-dd/stripname'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BrightlyWound(_BasicScraper):
    """Scraper definition for brightlywound.com."""

    latestUrl = 'http://www.brightlywound.com/'
    stripUrl = 'http://www.brightlywound.com/?comic=%s'
    # The page uses single-quoted attributes.
    imageSearch = compile(r'<img src=\'(comic/.+?)\'')
    # Captures the '?comic=<digits>' link inside the 'navback' div.
    prevSearch = compile(
        r'<div id=\'navback\'><a href=\'(\?comic\=\d+)\'><img src=\'images/previous.png\''
    )
    help = 'Index format: nnn'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# NOTE(review): this reuses the class name BlueCrashKit that is already
# defined earlier in this module (bluecrashkit.com); this later definition
# is the one the module-level name ends up bound to. Confirm that is intended.
class BlueCrashKit(_BasicScraper):
    """Scraper definition for Blue Crash Kit at robhamm.com."""

    latestUrl = 'http://robhamm.com/bluecrashkit'
    stripUrl = 'http://robhamm.com/comics/blue-crash-kit/%s'
    # Captures an absolute image URL under sites/default/files/comics/.
    imageSearch = compile(
        r'src="(http://robhamm.com/sites/default/files/comics/.+?)"'
    )
    # Captures the href inside the <li class="previous"> element.
    prevSearch = compile(r'<li class="previous"><a href="(.+?)">')
    help = 'Index format: yyyy-mm-dd'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BloodBound(_BasicScraper):
    """Scraper definition for bloodboundcomic.com."""

    latestUrl = 'http://www.bloodboundcomic.com/'
    stripUrl = 'http://www.bloodboundcomic.com/d/%s.html'
    # Captures the '/comics/...' image path.
    imageSearch = compile(r' src="(/comics/.+?)"')
    # Captures the '/d/...' href wrapping the previous_day.jpg image.
    prevSearch = compile(
        r' <a href="(/d/.+?)"><img[^>]+?src="/images/previous_day.jpg"'
    )
    help = 'Index format: yyyymmdd'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BookOfBiff(_BasicScraper):
    """Scraper definition for thebookofbiff.com."""

    latestUrl = 'http://www.thebookofbiff.com/'
    stripUrl = 'http://www.thebookofbiff.com/%s'
    # Captures any image URL containing '/comics/' (pattern built by tagre).
    imageSearch = compile(
        tagre("img", "src", r'([^"]+/comics/[^"]+)')
    )
    # Captures a link href; tagre is given after="Previous".
    prevSearch = compile(
        tagre("a", "href", r'([^"]+)', after="Previous")
    )
    help = 'Index format: yyyy/mm/dd/stripnum-strip-name'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BillyTheDunce(_BasicScraper):
    """Scraper definition for duncepress.com."""

    latestUrl = 'http://www.duncepress.com/'
    stripUrl = 'http://www.duncepress.com/%s/'
    # Captures an absolute image URL under /comics/.
    imageSearch = compile(
        r'<img src="(http://www.duncepress.com/comics/.+?)"'
    )
    # Captures the rel="prev" link inside the 'nav-previous' div.
    prevSearch = compile(
        r'<div class="nav-previous"><a href="(http://www.duncepress.com/[^"]+)" rel="prev">'
    )
    help = 'Index format: yyyy/mm/strip-name'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BackwaterPlanet(_BasicScraper):
    """Scraper definition for backwaterplanet.com."""

    latestUrl = 'http://www.backwaterplanet.com/current.htm'
    stripUrl = 'http://www.backwaterplanet.com/archive/bwp%s.htm'
    # Captures an image path starting with '/images/comic/bwp'.
    imageSearch = compile(r'<img src="(/images/comic/bwp.+?)">')
    # Group 1 is the '/archive/bwp...' href; group 2 is the Previous.jpg
    # src, accepted with or without a leading slash.
    prevSearch = compile(
        r'<a href="(/archive/bwp.+?)"><img src="(images/Previous.jpg|/images/Previous.jpg)"'
    )
    help = 'Index format: yymmdd'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Baroquen(_BasicScraper):
    """Scraper definition for baroquencomics.com."""

    latestUrl = 'http://www.baroquencomics.com/'
    # This used to be the fixed URL of a single strip
    # ('2010/01/04/the-man-from-omi/') with no '%s' placeholder, so an index
    # could not be substituted into it. The placeholder takes the
    # 'yyyy/mm/dd/strip-name' index described by the help text.
    stripUrl = 'http://www.baroquencomics.com/%s/'
    # Captures an absolute image URL under /Comics/.
    imageSearch = compile(
        r'<img src="(http://www.baroquencomics.com/Comics/.+?)"'
    )
    # Captures the absolute href of the link marked rel="prev".
    prevSearch = compile(
        r'<a href="(http://www.baroquencomics.com/.+?)" rel="prev">'
    )
    help = 'Index format: yyyy/mm/dd/strip-name'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BetweenFailures(_BasicScraper):
    """Scraper definition for betweenfailures.com."""

    latestUrl = 'http://betweenfailures.com/'
    stripUrl = 'http://betweenfailures.com/%s'
    # The image tag uses a single-quoted src attribute.
    imageSearch = compile(
        r'<img src=\'(http://betweenfailures.com/comics/.+?)\'>'
    )
    # Captures the href of the link whose text is '« Previous'.
    prevSearch = compile(
        r'<a href="(http://betweenfailures.com/.+?)">« Previous</a>'
    )
    help = 'Index format: yyyy/mm/dd/stripnum-strip-name'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BillyTheBeaker(_BasicScraper):
    """Scraper definition for billy.defectivejunk.com."""

    latestUrl = 'http://billy.defectivejunk.com/'
    stripUrl = 'http://billy.defectivejunk.com/index.php?strip=%s'
    # Captures an image name of the form 'bub<digits>_<digits>...'.
    imageSearch = compile(r'<img src="(bub\d+_\d+.+?)"')
    # Captures the strip link titled "Previous strip".
    prevSearch = compile(
        r' <a href="(index.php\?strip\=.+?)" title="Previous strip">'
    )
    help = 'Index format: nnn'
|