From ebe98bc8ba04718ad9dd8f0cffd10ebb4a8e73a7 Mon Sep 17 00:00:00 2001 From: Tobias Gruetzmacher Date: Sun, 12 Feb 2017 02:16:38 +0100 Subject: [PATCH] Fix some modules. --- dosagelib/plugins/d.py | 28 ++++++++++------------------ dosagelib/plugins/k.py | 11 +---------- dosagelib/plugins/m.py | 17 ++++++++--------- dosagelib/plugins/o.py | 12 ++++++------ dosagelib/plugins/p.py | 13 ++----------- dosagelib/plugins/s.py | 21 +++++++++------------ 6 files changed, 36 insertions(+), 66 deletions(-) diff --git a/dosagelib/plugins/d.py b/dosagelib/plugins/d.py index 6233ef24c..30b30594b 100644 --- a/dosagelib/plugins/d.py +++ b/dosagelib/plugins/d.py @@ -1,7 +1,7 @@ # -*- coding: utf-8 -*- # Copyright (C) 2004-2008 Tristan Seligmann and Jonathan Jacobs # Copyright (C) 2012-2014 Bastian Kleineidam -# Copyright (C) 2015-2016 Tobias Gruetzmacher +# Copyright (C) 2015-2017 Tobias Gruetzmacher from __future__ import absolute_import, division, print_function @@ -219,20 +219,19 @@ class DreamKeepersPrelude(_ParserScraper): help = 'Index format: n' -class DresdenCodak(_BasicScraper): +class DresdenCodak(_ParserScraper): url = 'http://dresdencodak.com/' - rurl = escape(url) - stripUrl = None + startUrl = url + 'cat/comic/' firstStripUrl = url + '2007/02/08/pom/' - imageSearch = compile(tagre("img", "src", r'(%scomics/[^"]+)' % rurl)) - prevSearch = compile(tagre("a", "href", r'(%s[^"]+)' % rurl) + - tagre("img", "src", r"%sm_prev2?\.png" % rurl, - quote="")) - latestSearch = compile(tagre("div", "id", "preview") + - tagre("a", "href", - r'(%s\d+/\d+/\d+/[^"]+)' % rurl)) + imageSearch = '//section[%s]//img' % xpath_class('entry-content') + prevSearch = '//a[@rel="prev"]' + latestSearch = '//a[%s]' % xpath_class('tc-grid-bg-link') starter = indirectStarter + # Blog and comic are mixed... + def shouldSkipUrl(self, url, data): + return not data.xpath(self.imageSearch) + class DrFun(_BasicScraper): baseUrl = 'http://www.ibiblio.org/Dave/' @@ -287,10 +286,3 @@ class DumbingOfAge(_BasicScraper): prevSearch = compile(tagre("a", "href", r'(%s\d+/[^"]+)' % rurl, after="prev")) imageSearch = compile(tagre("img", "src", r'(%scomics/\d+-\d+-\d+[^"]+)' % rurl)) help = 'Index format: yyyy/comic/book-num/seriesname/stripname' - - -class DungeonsAndDenizens(_WordPressScraper): - url = 'http://dungeond.com/' - firstStripUrl = url + '2005/08/23/08232005/' - endOfLife = True - prevSearch = '//a[%s]' % xpath_class('navi-prev') diff --git a/dosagelib/plugins/k.py b/dosagelib/plugins/k.py index f5b498a18..7b99de411 100644 --- a/dosagelib/plugins/k.py +++ b/dosagelib/plugins/k.py @@ -1,7 +1,7 @@ # -*- coding: utf-8 -*- # Copyright (C) 2004-2008 Tristan Seligmann and Jonathan Jacobs # Copyright (C) 2012-2014 Bastian Kleineidam -# Copyright (C) 2015-2016 Tobias Gruetzmacher +# Copyright (C) 2015-2017 Tobias Gruetzmacher from __future__ import absolute_import, division, print_function @@ -27,15 +27,6 @@ class KevinAndKell(_BasicScraper): return self.stripUrl % tuple(map(int, index.split('-'))) -class Key(_BasicScraper): - baseUrl = 'http://key.shadilyn.com/' - url = baseUrl + 'latestpage.html' - stripUrl = baseUrl + 'pages/%s.html' - imageSearch = compile(r'"((?:images/.+?)|(?:pages/images/.+?))"') - prevSearch = compile(r'