import datetime

import generic_news_rss_renderer as gnrss


class seattletimes_rss_renderer(gnrss.generic_news_rss_renderer):
    """RSS renderer for Seattle Times feeds, filtered by category.

    Headlines are kept only when the item's category text contains one of
    the names in ``interesting_categories``; articles are kept when they are
    recent enough and have a reasonably long description.

    NOTE(review): ``debug_print`` and ``is_item_older_than_n_days`` are not
    defined here; they are presumably inherited from
    ``generic_news_rss_renderer`` -- confirm against that module.
    """

    # Category names considered interesting.  Matching is by substring, so
    # e.g. 'Pacific NW' also matches a longer category containing that text.
    interesting_categories = frozenset([
        'Nation',
        'World',
        'Life',
        'Technology',  # the comma matters: without it this fuses with the next entry
        'Local News',
        'Food',
        'Drink',
        'Today File',
        'Seahawks',
        'Oddities',
        'Pacific NW',
        'Home',
        'Garden',
        'Travel',
        'Outdoors',
    ])

    def __init__(self, name_to_timeout_dict, feed_site, feed_uris, page_title):
        """Forward all construction arguments unchanged to the base class."""
        super(seattletimes_rss_renderer, self).__init__(
            name_to_timeout_dict,
            feed_site,
            feed_uris,
            page_title)

    def debug_prefix(self):
        """Return the tag identifying this renderer in debug output."""
        return "seattletimes"

    def get_headlines_page_prefix(self):
        """Return the name prefix used for the headlines page."""
        return "seattletimes-nonnews"

    def get_details_page_prefix(self):
        """Return the name prefix used for the details page."""
        return "seattletimes-details-nonnews"

    def should_use_https(self):
        """Return True: this feed is fetched over HTTPS."""
        return True

    def item_is_interesting_for_headlines(self, title, description, item):
        """Decide whether a feed item belongs on the headlines page.

        An item qualifies when it is an ``item`` element, is not older than
        14 days, and has a ``category`` child whose text contains at least
        one of ``interesting_categories``.

        Args:
            title: Item title; used only in debug messages.
            description: Item description; unused here.
            item: The feed element (assumed to be an ElementTree-style
                element exposing ``tag`` and iterable children -- confirm
                against the base class).

        Returns:
            True if the item should be shown as a headline, else False.
        """
        if item.tag != "item":
            self.debug_print("Item.tag isn't item?!")
            return False
        if self.is_item_older_than_n_days(item, 14):
            self.debug_print("%s: is too old!" % title)
            return False

        # Map child tag -> text.  If a tag repeats, the last occurrence wins.
        details = {}
        # Iterate the element directly: Element.getchildren() was removed in
        # Python 3.9, and direct iteration yields the same children.
        for detail in item:
            self.debug_print("detail %s => %s (%s)" % (detail.tag,
                                                       detail.attrib,
                                                       detail.text))
            if detail.text is not None:
                details[detail.tag] = detail.text

        if "category" not in details:
            self.debug_print("No category in details?!")
            self.debug_print(details)
            return False

        # Deliberately no early exit: every matching category is logged.
        interesting = False
        for x in seattletimes_rss_renderer.interesting_categories:
            if x in details["category"]:
                self.debug_print("%s looks like a good category." % x)
                interesting = True
        return interesting

    def item_is_interesting_for_article(self, title, description, item):
        """Decide whether a feed item deserves a details (article) page.

        Args:
            title: Item title; used only in debug messages.
            description: Item description text; must be at least 65
                characters long for the item to qualify.
            item: The feed element, passed to the age check.

        Returns:
            True if the item is at most 14 days old and its description has
            at least 65 characters, else False.
        """
        if self.is_item_older_than_n_days(item, 14):
            self.debug_print("%s: is too old!" % title)
            return False
        return len(description) >= 65


# Test
#x = seattletimes_rss_renderer({"Test": 123},
#                              "www.seattletimes.com",
#                              [ "/life/feed/" ],
#                              "nonnews")
#x.periodic_render("Fetch News")
#x.periodic_render("Shuffle News")