dosage/dosagelib/plugins/smackjeeves.py

# -*- coding: iso-8859-1 -*-
# Copyright (C) 2004-2005 Tristan Seligmann and Jonathan Jacobs
# Copyright (C) 2012 Bastian Kleineidam
from re import compile
from ..scraper import make_scraper
from ..helpers import bounceStarter
from ..util import tagre

# NOTE(review): tagre is assumed to build a regex string matching the given
# tag with the given attribute value -- confirm against ..util.tagre.

# Comic image: an <img> src under images/uploaded/comics/ on the www or
# img2 SmackJeeves host; the whole URL is the captured group.
_imageSearch = compile(
    tagre(
        "img",
        "src",
        r'(http://(?:www|img2)\.smackjeeves\.com/images/uploaded/comics/[^"]+)',
    )
)

# Shared prefix of both navigation patterns: an <a> href containing
# /comics/<digits>/, captured as a group.
_linkSearch = tagre("a", "href", r'([^"]*/comics/\d+/[^"]*)')

# Comic link directly followed by the "previous" marker: either an image
# with alt="< Previous" or the literal text "&lt; Back".
_prevSearch = compile(
    _linkSearch + '(?:<img[^>]*alt="< Previous"|&lt; Back)'
)

# Comic link directly followed by the "next" marker: either an image with
# alt="Next >" or the literal text "Next &gt;".
_nextSearch = compile(
    _linkSearch + '(?:<img[^>]*alt="Next >"|Next &gt;)'
)

def add(name):
    """Create the scraper for one SmackJeeves comic and publish it.

    name is the comic's subdomain on smackjeeves.com.  The object returned
    by make_scraper is stored in this module's globals under the key
    'SmackJeeves/<name>'.
    """
    # XXX mature content can be viewed directly with:
    # http://www.smackjeeves.com/mature.php?ref=<percent-encoded-url>
    baseUrl = 'http://%s.smackjeeves.com/comics/' % name
    classname = 'SmackJeeves/' + name

    @classmethod
    def namer(cls, imageUrl, pageUrl):
        # Second-to-last '/'-separated piece of the page URL, i.e. the
        # final path component when the URL ends with a slash.
        segments = pageUrl.split('/')
        return segments[-2]

    # Attributes handed to make_scraper as keyword arguments.
    attributes = dict(
        # NOTE(review): bounceStarter presumably locates the latest strip
        # by following the "next" link -- confirm in ..helpers.
        starter=bounceStarter(baseUrl, _nextSearch),
        stripUrl=baseUrl + '%s/',
        imageSearch=_imageSearch,
        prevSearch=_prevSearch,
        help='Index format: nnnn (some increasing number)',
        namer=namer,
    )
    globals()[classname] = make_scraper(classname, **attributes)


# Register every supported SmackJeeves comic, identified by its subdomain.
for _comic in (
    '20galaxies',
    'axe13',
    'beartholomew',
    'bliss',
    'durian',
    'heard',
    'mpmcomic',
    'nlmo-project',
    'paranoidloyd',
    'thatdreamagain',
    'wowcomics',
):
    add(_comic)
# Drop the loop variable so it does not linger in the module namespace.
del _comic
Fix some comics. 2012-11-21 20:57:26 +00:00			`# -*- coding: iso-8859-1 -*-`
			`# Copyright (C) 2004-2005 Tristan Seligmann and Jonathan Jacobs`
			`# Copyright (C) 2012 Bastian Kleineidam`
			`from re import compile`
Fix some comics. 2012-11-26 06:13:32 +00:00			`from ..scraper import make_scraper`
Fix some comics. 2012-11-21 20:57:26 +00:00			`from ..helpers import bounceStarter`
			`from ..util import tagre`

Fix some comics. 2012-12-02 17:35:06 +00:00			`_imageSearch = compile(tagre("img", "src", r'(http://(?:www\|img2)\.smackjeeves\.com/images/uploaded/comics/[^"]+)'))`
			`_linkSearch = tagre("a", "href", r'([^"]*/comics/\d+/[^"]*)')`
			`_prevSearch = compile(_linkSearch + '(?:<img[^>]*alt="< Previous"\|&lt; Back)')`
			`_nextSearch = compile(_linkSearch + '(?:<img[^>]*alt="Next >"\|Next &gt;)')`
Fix some comics. 2012-11-21 20:57:26 +00:00
Fix some comics. 2012-11-26 06:13:32 +00:00			`def add(name):`
			`classname = 'SmackJeeves/' + name`
Fix some comics. 2012-11-21 20:57:26 +00:00			`# XXX mature content can be viewed directly with:`
			`# http://www.smackjeeves.com/mature.php?ref=<percent-encoded-url>`
Fix some comics. 2012-11-26 06:13:32 +00:00			`baseUrl = 'http://%s.smackjeeves.com/comics/' % name`
Fix some comics. 2012-11-21 20:57:26 +00:00
Fix some comics. 2012-11-26 06:13:32 +00:00			`@classmethod`
			`def namer(cls, imageUrl, pageUrl):`
			`return pageUrl.split('/')[-2]`
Fix some comics. 2012-11-21 20:57:26 +00:00
Fix some comics. 2012-11-26 06:13:32 +00:00			`globals()[classname] = make_scraper(classname,`
Fix some comics. 2012-12-02 17:35:06 +00:00			`starter=bounceStarter(baseUrl, _nextSearch),`
			`stripUrl = baseUrl + '%s/',`
Add comic scripts, add fixes and other stuff. 2012-11-28 17:15:12 +00:00			`imageSearch = _imageSearch,`
			`prevSearch = _prevSearch,`
Fix some comics. 2012-11-26 06:13:32 +00:00			`help = 'Index format: nnnn (some increasing number)',`
			`namer = namer,`
			`)`
Fix some comics. 2012-11-21 20:57:26 +00:00

Fix some comics. 2012-11-26 06:13:32 +00:00			`add('20galaxies')`
			`add('axe13')`
			`add('beartholomew')`
			`add('bliss')`
			`add('durian')`
			`add('heard')`
			`add('mpmcomic')`
			`add('nlmo-project')`
			`add('paranoidloyd')`
			`add('thatdreamagain')`
			`add('wowcomics')`