@staticmethod
def looks_like_football(title: str, description: str) -> bool:
    """Return True when the item mentions the NFL or a live stream.

    Args:
        title: Item title. Checked for the literal "NFL" and for
            "live stream" / "livestream" (either word may be capitalised).
        description: Item description. Only checked for the two-word
            "live stream" form.

    Returns:
        True if any of the checks match, False otherwise.
    """
    if "NFL" in title:
        return True

    # The title is tested against both the spaced and the fused spelling.
    for stream_pattern in ("[Ll]ive [Ss]tream", "[Ll]ive[Ss]tream"):
        if re.search(stream_pattern, title):
            return True

    # The description is only tested against the spaced spelling.
    return re.search("[Ll]ive [Ss]tream", description) is not None
+
@staticmethod
def looks_like_review(title: str, description: str) -> bool:
    """Return True when the title contains "review" or "Review".

    This is a plain substring test, so words that merely embed the marker
    (e.g. "preview") match too, while other capitalisations such as
    "REVIEW" do not.

    Args:
        title: Item title to inspect.
        description: Unused; accepted so all ``looks_*`` checks share a
            signature.

    Returns:
        True if either marker occurs in ``title``.
    """
    markers = ("review", "Review")
    return any(marker in title for marker in markers)
+
@staticmethod
def looks_like_spam(title: str, description: str) -> bool:
    """Return True when the item matches one of the known spam markers.

    Markers checked:
      * description contains "marketplace" (this also covers
        "national-marketplace", which therefore needs no separate test);
      * title contains "THC";
      * title matches weed / cannabis / "top?rated" / "lose weight";
      * description matches cannabis / "lose weight".

    The regex checks accept either case for the first letter of each word
    only.

    Args:
        title: Item title; may be None.
        description: Item description; may be None (the callers in this
            class pass the result of ``item.findtext("description")``).

    Returns:
        True if any marker matches. False if nothing matches or if either
        argument is None.
    """
    # Without both fields there is nothing reliable to inspect.
    if title is None or description is None:
        return False

    title_patterns = (
        "[Ww]eed",
        "[Cc]annabis",
        # "." matches any single character, so "Top-Rated", "Top Rated",
        # "top_rated", ... are all caught.
        "[Tt]op.[Rr]ated",
        "[Ll]ose [Ww]eight",
    )
    description_patterns = (
        "[Cc]annabis",
        "[Ll]ose [Ww]eight",
    )

    return (
        "marketplace" in description
        or "THC" in title
        or any(re.search(pattern, title) for pattern in title_patterns)
        or any(
            re.search(pattern, description)
            for pattern in description_patterns
        )
    )
+
@staticmethod
def looks_very_boring(title: str, description: str) -> bool:
    """Return True when the description merely repeats part of the title.

    The comparison is case-insensitive: the lower-cased description must
    occur as a substring of the lower-cased title. Note that an empty
    description is a substring of every title and therefore always counts
    as boring.

    Args:
        title: Item title.
        description: Item description.

    Returns:
        True if ``description`` is contained in ``title``, ignoring case.
    """
    needle = description.lower()
    haystack = title.lower()
    return needle in haystack
+
def item_is_interesting_for_headlines(
    self, title: str, description: str, item: xml.etree.ElementTree.Element
) -> bool:
    """Decide whether a feed item should be shown as a headline.

    The item is rejected (and the reason logged) by the first check that
    fires, in this order: age (``is_item_older_than_n_days(item, 10)``),
    spam, football, review, very boring.

    Args:
        title: Item title, used by every content check and in log lines.
        description: Description supplied by the caller; used for the
            football, review and boring checks.
        item: The XML element for the item. Its "description" child text
            is re-read and used for the spam check instead of
            ``description``.

    Returns:
        True if no check rejects the item, False otherwise.
    """
    raw_description = item.findtext("description")
    checks = bellevue_reporter_rss_renderer

    keep = False
    if self.is_item_older_than_n_days(item, 10):
        logger.info(f"{title}: is too old!")
    elif checks.looks_like_spam(title, raw_description):
        logger.debug(f"{title}: looks like spam")
    elif checks.looks_like_football(title, description):
        logger.debug(f"{title}: looks like it's about football.")
    elif checks.looks_like_review(title, description):
        logger.debug(f"{title}: looks like a review.")
    elif checks.looks_very_boring(title, description):
        logger.debug(f"{title}: looks very boring.")
    else:
        keep = True
    return keep
+
def item_is_interesting_for_article(
    self, title: str, description: str, item: xml.etree.ElementTree.Element
) -> bool:
    """Decide whether a feed item should be shown as a full article.

    The item is rejected (and the reason logged at debug level) by the
    first check that fires, in this order: age
    (``is_item_older_than_n_days(item, 10)``), spam, football, review.
    Unlike the headline filter, no "very boring" check is applied here.

    Args:
        title: Item title, used by every content check and in log lines.
        description: Description supplied by the caller; used for the
            football and review checks.
        item: The XML element for the item. Its "description" child text
            is re-read and used for the spam check instead of
            ``description``.

    Returns:
        True if no check rejects the item, False otherwise.
    """
    raw_description = item.findtext("description")
    checks = bellevue_reporter_rss_renderer

    keep = False
    if self.is_item_older_than_n_days(item, 10):
        logger.debug(f"{title}: is too old!")
    elif checks.looks_like_spam(title, raw_description):
        logger.debug(f"{title}: looks like spam")
    elif checks.looks_like_football(title, description):
        logger.debug(f"{title}: looks like it's about football.")
    elif checks.looks_like_review(title, description):
        logger.debug(f"{title}: looks like a review.")
    else:
        keep = True
    return keep