GoComics doesn't allow spiders, so disable its comics for now...
This removes 757 comics, including quite popular ones like Calvin and Hobbes, Garfield, FoxTrot, etc. :(
This commit is contained in:
parent
7c15ea50d8
commit
472afa24d3
1 changed file with 4 additions and 0 deletions
|
@@ -17,6 +17,10 @@ _prevSearch = compile(tagre("a", "href", r'(/[^"]+/\d+/\d+/\d+)', after="prev"))
|
|||
_nextSearch = compile(tagre("a", "href", r'(/[^"]+/\d+/\d+/\d+)', after="next"))
|
||||
|
||||
def add(name, shortname):
|
||||
# Unfortunately, the whole http://assets.amuniversal.com/ is blocked by
|
||||
# robots.txt, so we disable GoComics for now...
|
||||
return
|
||||
|
||||
baseUrl = 'http://www.gocomics.com'
|
||||
url = baseUrl + shortname
|
||||
classname = 'GoComics_%s' % name
|
||||
|
|
Loading…
Reference in a new issue