Stop saying Bellevue Reporter!
author Scott Gasch <[email protected]>
Sat, 18 Feb 2023 02:18:40 +0000 (18:18 -0800)
committer Scott Gasch <[email protected]>
Sat, 18 Feb 2023 02:18:40 +0000 (18:18 -0800)
bellevue_reporter_rss_renderer.py

index 4420c80a5ed10ccbfd2b797efc88e99f9306e1c3..1e0ec0f700ece7e39367f859ac52c91cbab47ada 100644 (file)
@@ -22,9 +22,7 @@ class bellevue_reporter_rss_renderer(gnrss.generic_news_rss_renderer):
         feed_uris: List[str],
         page_title: str,
     ):
-        super().__init__(
-            name_to_timeout_dict, feed_site, feed_uris, page_title
-        )
+        super().__init__(name_to_timeout_dict, feed_site, feed_uris, page_title)
 
     def get_headlines_page_prefix(self) -> str:
         return "bellevue-reporter"
@@ -63,33 +61,42 @@ class bellevue_reporter_rss_renderer(gnrss.generic_news_rss_renderer):
             description is not None
             and title is not None
             and (
-                'marketplace' in description
-                or 'national-marketplace' in description
-                or re.search('[Ww]eed', title) is not None
-                or re.search('[Cc]annabis', title) is not None
-                or re.search('[Cc]annabis', description) is not None
-                or 'THC' in title
-                or re.search('[Tt]op.[Rr]ated', title) is not None
-                or re.search('[Ll]ose [Ww]eight', title) is not None
-                or re.search('[Ll]ose [Ww]eight', description) is not None
+                "marketplace" in description
+                or "national-marketplace" in description
+                or re.search("[Ww]eed", title) is not None
+                or re.search("[Cc]annabis", title) is not None
+                or re.search("[Cc]annabis", description) is not None
+                or "THC" in title
+                or re.search("[Tt]op.[Rr]ated", title) is not None
+                or re.search("[Ll]ose [Ww]eight", title) is not None
+                or re.search("[Ll]ose [Ww]eight", description) is not None
             )
         )
 
+    @staticmethod
+    def looks_very_boring(title: str, description: str) -> bool:
+        return description in title
+
     def item_is_interesting_for_headlines(
         self, title: str, description: str, item: xml.etree.ElementTree.Element
     ) -> bool:
         unfiltered_description = item.findtext("description")
         if self.is_item_older_than_n_days(item, 10):
-            logger.info(f'{title}: is too old!')
+            logger.info(f"{title}: is too old!")
             return False
-        if bellevue_reporter_rss_renderer.looks_like_spam(title, unfiltered_description):
-            logger.debug(f'{title}: looks like spam')
+        if bellevue_reporter_rss_renderer.looks_like_spam(
+            title, unfiltered_description
+        ):
+            logger.debug(f"{title}: looks like spam")
             return False
         if bellevue_reporter_rss_renderer.looks_like_football(title, description):
-            logger.debug(f'{title}: looks like it\'s about football.')
+            logger.debug(f"{title}: looks like it's about football.")
             return False
         if bellevue_reporter_rss_renderer.looks_like_review(title, description):
-            logger.debug(f'{title}: looks like a review.')
+            logger.debug(f"{title}: looks like a review.")
+            return False
+        if bellevue_reporter_rss_renderer.looks_very_boring(title, description):
+            logger.debug(f"{title}: looks very boring.")
             return False
         return True
 
@@ -98,16 +105,18 @@ class bellevue_reporter_rss_renderer(gnrss.generic_news_rss_renderer):
     ) -> bool:
         unfiltered_description = item.findtext("description")
         if self.is_item_older_than_n_days(item, 10):
-            logger.debug(f'{title}: is too old!')
+            logger.debug(f"{title}: is too old!")
             return False
-        if bellevue_reporter_rss_renderer.looks_like_spam(title, unfiltered_description):
-            logger.debug(f'{title}: looks like spam')
+        if bellevue_reporter_rss_renderer.looks_like_spam(
+            title, unfiltered_description
+        ):
+            logger.debug(f"{title}: looks like spam")
             return False
         if bellevue_reporter_rss_renderer.looks_like_football(title, description):
-            logger.debug(f'{title}: looks like it\'s about football.')
+            logger.debug(f"{title}: looks like it's about football.")
             return False
         if bellevue_reporter_rss_renderer.looks_like_review(title, description):
-            logger.debug(f'{title}: looks like a review.')
+            logger.debug(f"{title}: looks like a review.")
             return False
         return True