2017-05-14 22:54:02 +00:00
|
|
|
# -*- coding: utf-8 -*-
|
2016-10-28 22:21:41 +00:00
|
|
|
# Copyright (C) 2004-2008 Tristan Seligmann and Jonathan Jacobs
|
2017-05-14 22:54:02 +00:00
|
|
|
# Copyright (C) 2015-2017 Tobias Gruetzmacher
|
|
|
|
|
|
|
|
from __future__ import absolute_import, division, print_function
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
import xml.dom.minidom
|
|
|
|
import time
|
2013-02-10 07:00:32 +00:00
|
|
|
from .configuration import App
|
2012-06-20 19:58:13 +00:00
|
|
|
|
2017-05-14 22:54:02 +00:00
|
|
|
# TODO: Not sure if this RSS output is "valid", should be though.
|
|
|
|
# Might also be nice categorise Comics under one Item
|
|
|
|
|
|
|
|
|
2012-06-20 19:58:13 +00:00
|
|
|
class Feed(object):
|
2012-12-12 16:41:29 +00:00
|
|
|
"""Write an RSS feed with comic strip images."""
|
|
|
|
|
2013-02-10 07:00:32 +00:00
|
|
|
def __init__(self, title, link, description, lang='en-us', encoding="utf-8"):
|
2012-12-12 16:41:29 +00:00
|
|
|
"""Initialize RSS writer with given title, link and description."""
|
2013-02-10 07:00:32 +00:00
|
|
|
self.encoding = encoding
|
2012-06-20 19:58:13 +00:00
|
|
|
self.rss = xml.dom.minidom.Document()
|
2013-02-10 07:00:32 +00:00
|
|
|
root = self.rss.appendChild(self.rss.createElement('rss'))
|
|
|
|
root.setAttribute('version', '2.0')
|
|
|
|
self.channel = root.appendChild(self.rss.createElement('channel'))
|
2012-06-20 19:58:13 +00:00
|
|
|
self.addElement(self.channel, 'title', title)
|
|
|
|
self.addElement(self.channel, 'link', link)
|
|
|
|
self.addElement(self.channel, 'language', lang)
|
|
|
|
self.addElement(self.channel, 'description', description)
|
2013-02-10 07:00:32 +00:00
|
|
|
self.addElement(self.channel, 'generator', App)
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
def addElement(self, parent, tag, value):
|
2012-12-12 16:41:29 +00:00
|
|
|
"""Add an RSS item."""
|
2013-02-10 07:00:32 +00:00
|
|
|
elem = self.rss.createElement(tag)
|
|
|
|
node = self.rss.createTextNode(value)
|
|
|
|
return parent.appendChild(elem).appendChild(node)
|
2012-06-20 19:58:13 +00:00
|
|
|
|
2013-02-10 07:00:32 +00:00
|
|
|
def addItem(self, title, link, description, date, append=True):
|
2012-12-12 16:41:29 +00:00
|
|
|
"""Insert an item."""
|
2012-06-20 19:58:13 +00:00
|
|
|
item = self.rss.createElement('item')
|
|
|
|
|
|
|
|
self.addElement(item, 'title', title)
|
|
|
|
self.addElement(item, 'link', link)
|
|
|
|
self.addElement(item, 'description', description)
|
2013-02-10 07:00:32 +00:00
|
|
|
self.addElement(item, 'guid', link)
|
2012-06-20 19:58:13 +00:00
|
|
|
self.addElement(item, 'pubDate', date)
|
|
|
|
|
2013-02-10 07:00:32 +00:00
|
|
|
if append:
|
|
|
|
self.channel.appendChild(item)
|
|
|
|
else:
|
|
|
|
elems = self.rss.getElementsByTagName('item')
|
|
|
|
if elems:
|
|
|
|
self.channel.insertBefore(item, elems[0])
|
|
|
|
else:
|
|
|
|
self.channel.appendChild(item)
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
def write(self, path):
|
2012-12-12 16:41:29 +00:00
|
|
|
"""Write RSS content to file."""
|
2013-04-05 17:27:30 +00:00
|
|
|
with open(path, 'wb') as f:
|
2013-02-10 07:00:32 +00:00
|
|
|
f.write(self.getXML())
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
def getXML(self):
|
2012-12-12 16:41:29 +00:00
|
|
|
"""Get RSS content in XML format."""
|
2013-02-10 07:00:32 +00:00
|
|
|
return self.rss.toxml(self.encoding)
|
2012-06-20 19:58:13 +00:00
|
|
|
|
2012-12-12 16:41:29 +00:00
|
|
|
|
2012-06-20 19:58:13 +00:00
|
|
|
def parseFeed(filename, yesterday):
|
2012-12-12 16:41:29 +00:00
|
|
|
"""Parse an RSS feed and filter only entries that are newer than yesterday."""
|
2012-06-20 19:58:13 +00:00
|
|
|
dom = xml.dom.minidom.parse(filename)
|
|
|
|
|
2017-05-14 22:54:02 +00:00
|
|
|
def getText(node, tag):
|
|
|
|
node.getElementsByTagName(tag)[0].childNodes[0].data
|
|
|
|
|
|
|
|
def getNode(tag):
|
|
|
|
dom.getElementsByTagName(tag)
|
2012-06-20 19:58:13 +00:00
|
|
|
|
2017-05-14 22:54:02 +00:00
|
|
|
content = getNode('channel')[0] # Only one channel node
|
2012-06-20 19:58:13 +00:00
|
|
|
|
|
|
|
feedTitle = getText(content, 'title')
|
|
|
|
feedLink = getText(content, 'link')
|
|
|
|
feedDesc = getText(content, 'description')
|
|
|
|
|
|
|
|
feed = Feed(feedTitle, feedLink, feedDesc)
|
|
|
|
|
|
|
|
for item in getNode('item'):
|
|
|
|
itemDate = time.strptime(getText(item, 'pubDate'), '%a, %d %b %Y %H:%M:%S GMT')
|
2017-05-14 22:54:02 +00:00
|
|
|
if (itemDate > yesterday): # If newer than yesterday
|
2012-06-20 19:58:13 +00:00
|
|
|
feed.addItem(getText(item, 'title'),
|
|
|
|
getText(item, 'link'),
|
|
|
|
getText(item, 'description'),
|
|
|
|
getText(item, 'pubDate'))
|
|
|
|
return feed
|