dosage/dosagelib/plugins/r.py

# -*- coding: iso-8859-1 -*-
# Copyright (C) 2004-2005 Tristan Seligmann and Jonathan Jacobs
# Copyright (C) 2012 Bastian Kleineidam

from re import compile
from ..scraper import _BasicScraper
from ..helpers import bounceStarter
from ..util import tagre


class RadioactivePanda(_BasicScraper):
    # Scraper settings for the comic hosted at www.radioactivepanda.com.

    # User-facing hint describing the expected strip index.
    help = 'Index format: n (no padding)'

    # Site root; the strip URL template below is built on top of it.
    latestUrl = 'http://www.radioactivepanda.com/'
    # Template with a single '%s' placeholder after 'comic/'.
    stripUrl = latestUrl + 'comic/%s'

    # Group 1 captures a root-relative '/Assets/...' src of an <img> tag
    # that is later followed by the text "comicimg".
    imageSearch = compile(
        r'<img src="(/Assets/.*?)".+?"comicimg"'
    )
    # Group 1 captures a root-relative '/comic/...' href that is later
    # followed by the text previous_btn.
    prevSearch = compile(
        r'<a href="(/comic/.*?)".+?previous_btn'
    )


# XXX add other comics at http://petitesymphony.com/comics/
class Rascals(_BasicScraper):
    # Scraper settings for the Rascals comic at rascals.petitesymphony.com.

    # Site root (note the trailing slash).
    latestUrl = 'http://rascals.petitesymphony.com/'
    # latestUrl already ends with '/', so the suffix must not start with one;
    # otherwise the template would contain '//comic/', which does not agree
    # with the single-slash '/comic/' links matched by prevSearch below.
    stripUrl = latestUrl + 'comic/rascals-pg-%s/'
    # Group 1 captures an absolute image URL under /files/comics/.
    imageSearch = compile(tagre("img", "src", r'(http://rascals\.petitesymphony\.com/files/comics/[^"]+)'))
    # Group 1 captures an absolute /comic/ link; the after="Previous"
    # argument is handed to tagre.
    # NOTE(review): tagre's exact handling of 'after' lives in ..util - confirm there.
    prevSearch = compile(tagre("a", "href", r'(http://rascals\.petitesymphony\.com/comic/[^"]+)', after="Previous"))
    # User-facing hint describing the expected strip index.
    help = 'Index format: num'


class RealLife(_BasicScraper):
    # Scraper settings for Real Life Comics (www.reallifecomics.com).

    # Site root; the strip URL template below is built on top of it.
    latestUrl = 'http://www.reallifecomics.com/'
    # Template with a single '%s' placeholder: archive/<index>.html
    stripUrl = latestUrl + 'archive/%s.html'
    # Group 1 captures a root-relative '/comics/...' image path.
    imageSearch = compile(tagre("img", "src", r'(/comics/[^"]+)'))
    # An <a> tag pattern immediately followed by the pattern for the
    # nav_prev.png image; group 1 captures the '/archive/<digits>.html' href.
    # The dot before 'html' is escaped so it only matches a literal '.'.
    prevSearch = compile(tagre("a", "href", r'(/archive/\d+\.html)') + tagre("img", "src", r'/images/nav_prev\.png'))
    # User-facing hint describing the expected strip index
    # (the stray closing parenthesis was removed).
    help = 'Index format: yymmdd'


class RedString(_BasicScraper):
    # Scraper settings for Red String (www.redstring.strawberrycomics.com).

    # Site root; the strip URL template below is built on top of it.
    latestUrl = 'http://www.redstring.strawberrycomics.com/'
    # Template with a single '%s' placeholder: index.php?id=<index>
    stripUrl = latestUrl + 'index.php?id=%s'
    # Group 1 captures a relative 'comics/...' image path.  The value pattern
    # must not contain its own leading quote: every other tagre() call in this
    # file passes the bare attribute value.
    # NOTE(review): this presumes tagre supplies the surrounding quotes itself -
    # confirm against ..util.tagre.
    imageSearch = compile(tagre("img", "src", r'(comics/[^"]+)'))
    # Group 1 captures a root-relative '/index.php?id=<digits>' href; the
    # after="prev" argument is handed to tagre.
    prevSearch = compile(tagre("a", "href", r'(/index\.php\?id=\d+)', after="prev"))
    # User-facing hint describing the expected strip index.
    help = 'Index format: nnn'


class Roza(_BasicScraper):
    # Scraper settings for Roza (www.junglestudio.com/roza).

    # Entry page; the strip URL template below appends a query string to it.
    latestUrl = 'http://www.junglestudio.com/roza/index.php'
    # Template with a single '%s' placeholder: index.php?date=<index>
    stripUrl = latestUrl + '?date=%s'
    # Group 1 captures a relative 'pages/...' image path.
    imageSearch = compile(r'<img src="(pages/.+?)"')
    # Group 1 captures a relative 'index.php?date=...' href that is later
    # followed by the navtable_01.gif image name.  The dots in 'index.php'
    # and 'navtable_01.gif' are escaped so they only match a literal '.'.
    prevSearch = compile(r'<a href="(index\.php\?date=.+?)">[^>].+?navtable_01\.gif')
    # User-facing hint describing the expected strip index.
    help = 'Index format: yyyy-mm-dd'


class RedMeat(_BasicScraper):
    # Scraper settings for Red Meat (www.redmeat.com).

    # User-facing hint describing the expected strip index.
    help = 'Index format: yyyy-mm-dd'

    # Template with a single '%s' placeholder: redmeat/<index>/index.html
    stripUrl = 'http://www.redmeat.com/redmeat/%s/index.html'

    # Built from the "current" page URL and a pattern whose group 1 captures
    # the relative '../yyyy-mm-dd/index.html' link labelled "next".
    # NOTE(review): how bounceStarter uses these two arguments is defined in
    # ..helpers - confirm there.
    starter = bounceStarter(
        'http://www.redmeat.com/redmeat/current/index.html',
        compile(r'<a href="(\.\./\d{4}-\d{2}-\d{2}/index\.html)">next</a>')
    )

    # Group 1 captures the literal file name 'index-1.gif' from an <img> tag
    # that also carries numeric width and height attributes.
    imageSearch = compile(
        r'<img src="(index-1\.gif)" width="\d+" height="\d+" [^>]*>'
    )
    # Group 1 captures the relative '../yyyy-mm-dd/index.html' link labelled
    # "previous".
    prevSearch = compile(
        r'<a href="(\.\./\d{4}-\d{2}-\d{2}/index\.html)">previous</a>'
    )

    @classmethod
    def namer(cls, imageUrl, pageUrl):
        """Return the second-to-last '/'-separated component of imageUrl.

        pageUrl is accepted but not used.
        """
        # Only the last two separators matter for picking that component.
        pieces = imageUrl.rsplit('/', 2)
        return pieces[-2]
Updated copyright for all source files. 2012-06-20 20:41:04 +00:00			`# -- coding: iso-8859-1 --`
			`# Copyright (C) 2004-2005 Tristan Seligmann and Jonathan Jacobs`
Fix some comics. 2012-11-21 20:57:26 +00:00			`# Copyright (C) 2012 Bastian Kleineidam`
Initial commit to Github. 2012-06-20 19:58:13 +00:00
Fix some comics. 2012-11-21 20:57:26 +00:00			`from re import compile`
A lot of refactoring. 2012-10-11 10:03:12 +00:00			`from ..scraper import _BasicScraper`
			`from ..helpers import bounceStarter`
Fix some comics. 2012-11-21 20:57:26 +00:00			`from ..util import tagre`
Initial commit to Github. 2012-06-20 19:58:13 +00:00

			`class RadioactivePanda(_BasicScraper):`
			`latestUrl = 'http://www.radioactivepanda.com/'`
Updated documentation and fix some comics. 2012-11-20 17:53:53 +00:00			`stripUrl = latestUrl + 'comic/%s'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'<img src="(/Assets/.*?)".+?"comicimg"')`
			`prevSearch = compile(r'<a href="(/comic/.*?)".+?previous_btn')`
			`help = 'Index format: n (no padding)'`


Fix some comics. 2012-11-21 20:57:26 +00:00			`# XXX add other comics at http://petitesymphony.com/comics/`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`class Rascals(_BasicScraper):`
Fix some comics. 2012-11-21 20:57:26 +00:00			`latestUrl = 'http://rascals.petitesymphony.com/'`
			`stripUrl = latestUrl + '/comic/rascals-pg-%s/'`
			`imageSearch = compile(tagre("img", "src", r'(http://rascals\.petitesymphony\.com/files/comics/[^"]+)'))`
			`prevSearch = compile(tagre("a", "href", r'(http://rascals\.petitesymphony\.com/comic/[^"]+)', after="Previous"))`
			`help = 'Index format: num'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00

			`class RealLife(_BasicScraper):`
			`latestUrl = 'http://www.reallifecomics.com/'`
Fix some comics. 2012-11-21 20:57:26 +00:00			`stripUrl = latestUrl + 'archive/%s.html'`
			`imageSearch = compile(tagre("img", "src", r'(/comics/[^"]+)'))`
			`prevSearch = compile(tagre("a", "href", r'(/archive/\d+.html)') + tagre("img", "src", r'/images/nav_prev\.png'))`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`help = 'Index format: yymmdd)'`


			`class RedString(_BasicScraper):`
			`latestUrl = 'http://www.redstring.strawberrycomics.com/'`
Fix some comics. 2012-11-21 20:57:26 +00:00			`stripUrl = latestUrl + 'index.php?id=%s'`
			`imageSearch = compile(tagre("img", "src", r'("comics/[^"]+)'))`
			`prevSearch = compile(tagre("a", "href", r'(/index\.php\?id=\d+)', after="prev"))`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`help = 'Index format: nnn'`


			`class Roza(_BasicScraper):`
			`latestUrl = 'http://www.junglestudio.com/roza/index.php'`
Updated documentation and fix some comics. 2012-11-20 17:53:53 +00:00			`stripUrl = latestUrl + '?date=%s'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'<img src="(pages/.+?)"')`
			`prevSearch = compile(r'<a href="(index.php\?date=.+?)">[^>].+?navtable_01.gif')`
			`help = 'Index format: yyyy-mm-dd'`


			`class RedMeat(_BasicScraper):`
			`starter = bounceStarter('http://www.redmeat.com/redmeat/current/index.html', compile(r'<a href="(\.\./\d{4}-\d{2}-\d{2}/index\.html)">next</a>'))`
Rename imageUrl to stripUrl. 2012-11-13 18:10:19 +00:00			`stripUrl = 'http://www.redmeat.com/redmeat/%s/index.html'`
Initial commit to Github. 2012-06-20 19:58:13 +00:00			`imageSearch = compile(r'<img src="(index-1\.gif)" width="\d+" height="\d+" [^>]*>')`
			`prevSearch = compile(r'<a href="(\.\./\d{4}-\d{2}-\d{2}/index\.html)">previous</a>')`
			`help = 'Index format: yyyy-mm-dd'`

			`@classmethod`
			`def namer(cls, imageUrl, pageUrl):`
			`return imageUrl.split('/')[-2]`