import datetime

import generic_news_rss_renderer as gnrss


class seattletimes_rss_renderer(gnrss.generic_news_rss_renderer):
    """Seattle Times specialization of the generic news RSS renderer.

    Supplies the page prefixes and debug prefix for this feed, and filters
    feed items by age, by category (for headlines) and by description
    length (for articles).
    """

    # Names that mark an item as interesting for headlines.  Each name is
    # matched as a case-sensitive substring of the item's <category> text.
    interesting_categories = frozenset(
        [
            "Nation",
            "World",
            "Life",
            "Technology",
            "Local News",
            "Food",
            "Drink",
            "Today File",
            "Seahawks",
            "Oddities",
            "Pacific NW",
            "Home",
            "Garden",
            "Travel",
            "Outdoors",
        ]
    )

    def __init__(self, name_to_timeout_dict, feed_site, feed_uris, page_title):
        """Forward all arguments unchanged to the base renderer."""
        super(seattletimes_rss_renderer, self).__init__(
            name_to_timeout_dict, feed_site, feed_uris, page_title
        )

    def debug_prefix(self):
        """Return the tag identifying this renderer in debug output."""
        return "seattletimes"

    def get_headlines_page_prefix(self):
        """Return the prefix string used for the headlines page."""
        return "seattletimes-nonnews"

    def get_details_page_prefix(self):
        """Return the prefix string used for the details page."""
        return "seattletimes-details-nonnews"

    def should_use_https(self):
        """Return True: this feed is to be fetched over HTTPS."""
        return True

    def item_is_interesting_for_headlines(self, title, description, item):
        """Decide whether a feed item qualifies for the headlines page.

        Args:
            title: Item title; only used in debug messages here.
            description: Item description; unused by this check.
            item: The feed element; expected to expose ``tag`` and to be
                iterable over child elements having ``tag``, ``attrib``
                and ``text`` (ElementTree-style).

        Returns:
            True when the item is an ``<item>`` element, is not older than
            14 days, and its category text contains at least one entry of
            ``interesting_categories``; False otherwise.
        """
        if item.tag != "item":
            self.debug_print("Item.tag isn't item?!")
            return False
        if self.is_item_older_than_n_days(item, 14):
            self.debug_print("%s: is too old!" % title)
            return False

        # Map child tag -> text.  Iterate the element directly:
        # Element.getchildren() no longer exists on Python 3.9+.
        # NOTE: when a tag repeats (e.g. several <category> children), the
        # last one with text wins.
        details = {}
        for detail in item:
            self.debug_print(
                "detail %s => %s (%s)" % (detail.tag, detail.attrib, detail.text)
            )
            if detail.text is not None:
                details[detail.tag] = detail.text

        if "category" not in details:
            self.debug_print("No category in details?!")
            self.debug_print(details)
            return False

        category = details["category"]
        interesting = False
        # Deliberately no early exit: every matching category is logged.
        for x in seattletimes_rss_renderer.interesting_categories:
            if x in category:
                self.debug_print("%s looks like a good category." % x)
                interesting = True
        return interesting

    def item_is_interesting_for_article(self, title, description, item):
        """Decide whether a feed item qualifies for the article/details page.

        Args:
            title: Item title; only used in debug messages here.
            description: Item description text, or None.
            item: The feed element, passed to the age check.

        Returns:
            True when the item is not older than 14 days and its description
            is at least 65 characters long; False otherwise (including when
            the description is None).
        """
        if self.is_item_older_than_n_days(item, 14):
            self.debug_print("%s: is too old!" % title)
            return False
        # A missing description cannot be long enough; avoid len(None).
        return description is not None and len(description) >= 65


# Test
# x = seattletimes_rss_renderer({"Test": 123},
#                               "www.seattletimes.com",
#                               [ "/life/feed/" ],
#                               "nonnews")
# x.periodic_render("Fetch News")
# x.periodic_render("Shuffle News")