import datetime
import generic_news_rss_renderer as gnrss
+
class seattletimes_rss_renderer(gnrss.generic_news_rss_renderer):
# Category names that mark a feed item as interesting.  How the set is
# consulted is not visible in this chunk (presumably by the headline
# filter -- verify against the caller).
#
# Every entry needs its own trailing comma: Python concatenates adjacent
# string literals, so a missing comma silently merges two names into one
# (previously "Technology" and "Local News" were fused into the single,
# never-matching entry "TechnologyLocal News").
interesting_categories = frozenset(
    [
        "Nation",
        "World",
        "Life",
        "Technology",
        "Local News",
        "Food",
        "Drink",
        "Today File",
        "Seahawks",
        "Oddities",
        # Was misspelled "Packfic NW"; assumes the feed uses the normal
        # spelling -- confirm against a live feed.
        "Pacific NW",
        "Home",
        "Garden",
        "Travel",
        "Outdoors",
    ]
)
def __init__(self, name_to_timeout_dict, feed_site, feed_uris, page_title):
    """Initialize the renderer by delegating to the base class.

    All four arguments are forwarded, unchanged and in the same order,
    to the parent initializer; this subclass adds no state of its own.
    """
    base = super(seattletimes_rss_renderer, self)
    base.__init__(name_to_timeout_dict, feed_site, feed_uris, page_title)
def debug_prefix(self):
    """Return the constant label ``"seattletimes"`` for this renderer.

    Presumably used to tag this renderer's debug output; the consumer
    of the value is not visible here.
    """
    prefix = "seattletimes"
    return prefix
self.debug_print("Item.tag isn't item?!")
return False
if self.is_item_older_than_n_days(item, 14):
+ self.debug_print("%s: is too old!" % title)
return False
details = {}
for detail in item.getchildren():
- self.debug_print("detail %s => %s (%s)" % (detail.tag,
- detail.attrib,
- detail.text))
+ self.debug_print(
+ "detail %s => %s (%s)" % (detail.tag, detail.attrib, detail.text)
+ )
if detail.text != None:
details[detail.tag] = detail.text
if "category" not in details:
interesting = True
if not interesting:
return False
-
- if 'enclosure' in details:
- if 'pubDate' in details:
- x = details['pubDate']
- x = x.rsplit(' ', 1)[0]
- # Fri, 13 Nov 2015 10:07:00
- dt = datetime.datetime.strptime(x, '%a, %d %b %Y %H:%M:%S')
- if dt < self.oldest:
- self.debug_print("%s is too old." % (
- details["pubDate"]))
- return False
return True
def item_is_interesting_for_article(self, title, description, item):
    """Decide whether a feed item qualifies as an article.

    An item qualifies when ``self.is_item_older_than_n_days(item, 14)``
    is false and its description is at least 65 characters long.  When
    the age check rejects the item, a debug line naming ``title`` is
    emitted via ``self.debug_print`` before returning.

    Returns:
        bool: True if the item should be kept, False otherwise.
    """
    max_age_days = 14
    min_description_length = 65

    too_old = self.is_item_older_than_n_days(item, max_age_days)
    if not too_old:
        # Only fresh items reach the length test.
        return len(description) >= min_description_length

    self.debug_print("%s: is too old!" % title)
    return False

# Manual smoke test (uncomment to run).  The first argument is the
# name -> timeout mapping, so it must be a dict, not a set literal.
# x = seattletimes_rss_renderer({"Test": 123},
#                               "www.seattletimes.com",
#                               ["/life/feed/"],
#                               "nonnews")
# x.periodic_render("Fetch News")
# x.periodic_render("Shuffle News")