Also check robots.txt on image downloads.

We DO want to honour robots.txt when it blocks images.
This commit is contained in:
Tobias Gruetzmacher 2015-07-15 23:50:57 +02:00
parent 5affd8af68
commit 7c15ea50d8

View file

@ -205,6 +205,7 @@ def getPageContent(url, session, max_content_bytes=MaxContentBytes):
def getImageObject(url, referrer, session, max_content_bytes=MaxImageBytes):
    """Return the response object for an image URL.

    The robots.txt check is run for ``url`` before the request is made,
    so image downloads go through the same check as other fetches.

    Args:
        url: Address of the image to fetch.
        referrer: Passed to ``urlopen`` as the ``referrer`` keyword.
        session: Session object handed to both ``check_robotstxt`` and
            ``urlopen``.
        max_content_bytes: Size limit forwarded to ``urlopen``; defaults
            to ``MaxImageBytes``.

    Returns:
        Whatever ``urlopen`` returns for the streamed request.
    """
    # NOTE(review): presumably check_robotstxt raises when the URL is
    # disallowed -- confirm against its definition.
    check_robotstxt(url, session)
    response = urlopen(
        url,
        session,
        referrer=referrer,
        max_content_bytes=max_content_bytes,
        stream=True,
    )
    return response