python_utils.git / commitdiff (from parent 1: 0d63d44)
More cleanup, yey!

author    Scott Gasch <[email protected]>  Wed, 9 Feb 2022 01:46:56 +0000 (17:46 -0800)
committer Scott Gasch <[email protected]>  Wed, 9 Feb 2022 01:46:56 +0000 (17:46 -0800)
26 files changed:

function_utils.py
google_assistant.py
histogram.py
id_generator.py
input_utils.py
letter_compress.py
list_utils.py
lockfile.py
logging_utils.py
logical_search.py
math_utils.py
misc_utils.py
parallelize.py
persistent.py
profanity_filter.py
remote_worker.py
site_config.py
smart_future.py
state_tracker.py
stopwatch.py
string_utils.py
text_utils.py
thread_utils.py
type_utils.py
unittest_utils.py
unscrambler.py
diff --git a/function_utils.py b/function_utils.py
index 3c8e4ae10f4f493edb22c35ad3758442b4f224dd..f10776211df3ef8347d48486671577bc18d044bc 100644
--- a/function_utils.py
+++ b/function_utils.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 
+"""Helper methods dealing with functions."""
+
 from typing import Callable
diff --git a/google_assistant.py b/google_assistant.py
index b0aabf37095ef986b35b726d02700f55d017f78b..4a3a58f5947ab335e26ac2fa1c7ce22afd841a93 100644
--- a/google_assistant.py
+++ b/google_assistant.py
@@ -1,7 +1,9 @@
 #!/usr/bin/env python3
 
+"""A module to serve as a local client library around HTTP calls to
+the Google Assistant via a local gateway."""
+
 import logging
-import sys
 import warnings
 from typing import NamedTuple, Optional
@@ -33,6 +35,8 @@ parser.add_argument(
 
 class GoogleResponse(NamedTuple):
+    """A response wrapper."""
+
     success: bool
     response: str
     audio_url: str
@@ -57,7 +61,7 @@ def ask_google(cmd: str, *, recognize_speech=True) -> GoogleResponse:
     is True, perform speech recognition on the audio response from Google so as
     to translate it into text (best effort, YMMV).
     """
-    logging.debug(f"Asking google: '{cmd}'")
+    logging.debug("Asking google: '%s'", cmd)
     payload = {
         "command": cmd,
         "user": config.config['google_assistant_username'],
@@ -76,7 +80,7 @@ def ask_google(cmd: str, *, recognize_speech=True) -> GoogleResponse:
     if success:
         logger.debug('Google request succeeded.')
         if len(response) > 0:
-            logger.debug(f"Google said: '{response}'")
+            logger.debug("Google said: '%s'", response)
         audio = f"{config.config['google_assistant_bridge']}{j['audio']}"
         if recognize_speech:
             recognizer = sr.Recognizer()
@@ -92,7 +96,7 @@ def ask_google(cmd: str, *, recognize_speech=True) -> GoogleResponse:
             audio_transcription = recognizer.recognize_google(
                 speech,
             )
-            logger.debug(f"Transcription: '{audio_transcription}'")
+            logger.debug("Transcription: '%s'", audio_transcription)
         except sr.UnknownValueError as e:
             logger.exception(e)
             msg = 'Unable to parse Google assistant\'s response.'
@@ -114,4 +118,3 @@ def ask_google(cmd: str, *, recognize_speech=True) -> GoogleResponse:
         audio_url=audio,
         audio_transcription=audio_transcription,
     )
-    sys.exit(-1)
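Most hunks in this commit follow the same pattern as the ones above: f-string log calls become %-style templates with separate arguments, so formatting is deferred until the logging framework decides the record will actually be emitted. A minimal standalone sketch of the difference (illustration only, not code from this repo):

    import logging

    logging.basicConfig(level=logging.INFO)
    logger = logging.getLogger(__name__)
    cmd = "turn on the lights"

    # Eager: the f-string is rendered before debug() even runs, then the
    # record is discarded because DEBUG < INFO.
    logger.debug(f"Asking google: '{cmd}'")

    # Lazy: debug() stores the template and args; rendering only happens if
    # a handler actually emits the record.
    logger.debug("Asking google: '%s'", cmd)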
diff --git a/histogram.py b/histogram.py
index c673e161a6318fabeb155e1cdb2a2591abe730e0..f85abea2c45f05ef65c70657bd1b2b6f53f04c04 100644
--- a/histogram.py
+++ b/histogram.py
@@ -1,8 +1,9 @@
 #!/usr/bin/env python3
 # -*- coding: utf-8 -*-
 
+"""A text-based simple histogram helper class."""
+
 import math
-from numbers import Number
 from typing import Dict, Generic, Iterable, List, Optional, Tuple, TypeVar
 
 T = TypeVar("T", int, float)
@@ -11,6 +12,8 @@ Count = int
 
 class SimpleHistogram(Generic[T]):
+    """A simple histogram."""
+
     # Useful in defining wide open bottom/top bucket bounds:
     POSITIVE_INFINITY = math.inf
     NEGATIVE_INFINITY = -math.inf
diff --git a/id_generator.py b/id_generator.py
index d4c70166bb3c52974793840cb8bebbf288500a49..dc2ac9cc810a4e1d588d60231371e873d9d31966 100644
--- a/id_generator.py
+++ b/id_generator.py
@@ -1,5 +1,8 @@
 #!/usr/bin/env python3
 
+"""A helper class for generating thread safe monotonically increasing
+id numbers."""
+
 import itertools
 import logging
@@ -28,7 +31,7 @@ def get(name: str, *, start=0) -> int:
     if name not in generators:
         generators[name] = itertools.count(start, 1)
     x = next(generators[name])
-    logger.debug(f"Generated next id {x}")
+    logger.debug("Generated next id %d", x)
     return x
diff --git a/input_utils.py b/input_utils.py
index a166d7a4169e56937e8bb63c4398aff1abc52564..7d5e18089331a96bc32172b90e916a37c0695d49 100644
--- a/input_utils.py
+++ b/input_utils.py
@@ -37,7 +37,7 @@ def single_keystroke_response(
     try:
         while True:
             response = readchar.readchar()
-            logger.debug(f'Keystroke: {ord(response)}')
+            logger.debug('Keystroke: 0x%x', ord(response))
             if response in valid_responses:
                 break
             if ord(response) in os_special_keystrokes:
diff --git a/letter_compress.py b/letter_compress.py
index 9b4cf194c3d97a83c68c47bd0199a65c3a6e1698..42f06dae79a8357bcffd0730194d5c2d1d352f11 100644
--- a/letter_compress.py
+++ b/letter_compress.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 
+"""A simple compression helper for lowercase ascii text."""
+
 import bitstring
 
 from collect.bidict import BiDict
@@ -32,14 +34,12 @@ def compress(uncompressed: str) -> bytes:
     """
     compressed = bitstring.BitArray()
-    for (n, letter) in enumerate(uncompressed):
+    for letter in uncompressed:
         if 'a' <= letter <= 'z':
             bits = ord(letter) - ord('a') + 1  # 1..26
         else:
             if letter not in special_characters:
-                raise Exception(
-                    f'"{uncompressed}" contains uncompressable char="{letter}"'
-                )
+                raise Exception(f'"{uncompressed}" contains uncompressable char="{letter}"')
             bits = special_characters[letter]
         compressed.append(f"uint:5={bits}")
     while len(compressed) % 8 != 0:
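For context on the loop being simplified above: compress() spends 5 bits per character (codes 1..26 for 'a'..'z', the rest reserved for a small special-character table) and pads the stream to a byte boundary. A back-of-the-envelope size calculation, written fresh here for illustration:

    # Each character costs 5 bits; round the total up to whole bytes.
    def packed_size_bytes(n_chars: int) -> int:
        bits = 5 * n_chars
        return (bits + 7) // 8

    assert packed_size_bytes(5) == 4   # 25 bits -> 4 bytes (vs. 5 bytes of ASCII)
    assert packed_size_bytes(8) == 5   # 40 bits -> 5 bytes (vs. 8 bytes of ASCII)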
diff --git a/list_utils.py b/list_utils.py
index d70159a1b2dadb61640eae20f029608cabd2f46e..91af8f9eb924fb7e7e04932d58a1bcb6eded0690 100644
--- a/list_utils.py
+++ b/list_utils.py
@@ -1,8 +1,10 @@
 #!/usr/bin/env python3
 
+"""Some useful(?) utilities for dealing with Lists."""
+
 from collections import Counter
 from itertools import islice
-from typing import Any, Iterator, List, Mapping, Sequence, Tuple
+from typing import Any, Iterator, List, Sequence, Tuple
 
 def shard(lst: List[Any], size: int) -> Iterator[Any]:
@@ -230,9 +232,7 @@ def _permute(seq: str, path: str):
         yield from _permute(cdr, path + car)
 
-def binary_search(
-    lst: Sequence[Any], target: Any, *, sanity_check=False
-) -> Tuple[bool, int]:
+def binary_search(lst: Sequence[Any], target: Any, *, sanity_check=False) -> Tuple[bool, int]:
     """Performs a binary search on lst (which must already be sorted).
     Returns a Tuple composed of a bool which indicates whether the
     target was found and an int which indicates the index closest to
@@ -267,9 +267,7 @@ def binary_search(
     return _binary_search(lst, target, 0, len(lst) - 1)
 
-def _binary_search(
-    lst: Sequence[Any], target: Any, low: int, high: int
-) -> Tuple[bool, int]:
+def _binary_search(lst: Sequence[Any], target: Any, low: int, high: int) -> Tuple[bool, int]:
     if high >= low:
         mid = (high + low) // 2
         if lst[mid] == target:
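binary_search's collapsed signature still honors the same contract as its docstring: a (found, index) tuple. An iterative sketch of that contract, for illustration (this is not the module's recursive implementation):

    from typing import Any, Sequence, Tuple

    def binary_search_sketch(lst: Sequence[Any], target: Any) -> Tuple[bool, int]:
        low, high = 0, len(lst) - 1
        while low <= high:
            mid = (high + low) // 2
            if lst[mid] == target:
                return True, mid
            if lst[mid] < target:
                low = mid + 1
            else:
                high = mid - 1
        return False, low  # nearest insertion point when not found

    assert binary_search_sketch([1, 3, 5, 7, 9], 5) == (True, 2)
    assert binary_search_sketch([1, 3, 5, 7, 9], 6) == (False, 3)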
diff --git a/lockfile.py b/lockfile.py
index 290710759dbc702fff757ae2561fe5c0af3051a6..6993cb84d5e88f8dd6fc1a9d28a849f0cfd28713 100644
--- a/lockfile.py
+++ b/lockfile.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 
+"""File-based locking helper."""
+
 import datetime
 import json
 import logging
@@ -26,11 +28,15 @@ logger = logging.getLogger(__name__)
 
 class LockFileException(Exception):
+    """An exception related to lock files."""
+
     pass
 
 
 @dataclass
 class LockFileContents:
+    """The contents we'll write to each lock file."""
+
     pid: int
     commandline: str
     expiration_timestamp: Optional[float]
@@ -56,9 +62,10 @@ class LockFile(object):
         expiration_timestamp: Optional[float] = None,
         override_command: Optional[str] = None,
     ) -> None:
-        self.is_locked = False
-        self.lockfile = lockfile_path
-        self.override_command = override_command
+        self.is_locked: bool = False
+        self.lockfile: str = lockfile_path
+        self.locktime: Optional[int] = None
+        self.override_command: Optional[str] = override_command
         if do_signal_cleanup:
             signal.signal(signal.SIGINT, self._signal)
             signal.signal(signal.SIGTERM, self._signal)
@@ -71,7 +78,7 @@ class LockFile(object):
         return not os.path.exists(self.lockfile)
 
     def try_acquire_lock_once(self) -> bool:
-        logger.debug(f"Trying to acquire {self.lockfile}.")
+        logger.debug("Trying to acquire %s.", self.lockfile)
         try:
             # Attempt to create the lockfile.  These flags cause
             # os.open to raise an OSError if the file already
@@ -81,13 +88,12 @@ class LockFile(object):
                 contents = self._get_lockfile_contents()
                 logger.debug(contents)
                 f.write(contents)
-            logger.debug(f'Success; I own {self.lockfile}.')
+            logger.debug('Success; I own %s.', self.lockfile)
             self.is_locked = True
             return True
         except OSError:
             pass
-        msg = f'Could not acquire {self.lockfile}.'
-        logger.warning(msg)
+        logger.warning('Couldn\'t acquire %s.', self.lockfile)
         return False
 
     def acquire_with_retries(
@@ -125,7 +131,7 @@ class LockFile(object):
             logger.warning(msg)
             raise LockFileException(msg)
 
-    def __exit__(self, type, value, traceback):
+    def __exit__(self, _, value, traceback):
        if self.locktime:
            ts = datetime.datetime.now().timestamp()
            duration = ts - self.locktime
@@ -164,7 +170,7 @@ class LockFile(object):
             line = lines[0]
             line_dict = json.loads(line)
             contents = LockFileContents(**line_dict)
-            logger.debug(f'Blocking lock contents="{contents}"')
+            logger.debug('Blocking lock contents="%s"', contents)
 
             # Does the PID exist still?
             try:
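try_acquire_lock_once() leans on the os.open flags that the comment in the hunk above alludes to: O_CREAT | O_EXCL makes creation atomic, so exactly one contender can create the lock file even under heavy racing. The idiom in isolation (hypothetical helper, not from the module):

    import os

    def try_create_exclusively(path: str) -> bool:
        """Return True iff we atomically created path (i.e. we hold the lock)."""
        try:
            fd = os.open(path, os.O_CREAT | os.O_EXCL | os.O_WRONLY, 0o644)
        except FileExistsError:   # a subclass of OSError: someone beat us to it
            return False
        os.close(fd)
        return True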
diff --git a/logging_utils.py b/logging_utils.py
index ca1544150065b367b976d9ca43382fa1a6cff5e5..706a0543a93c4fa04b37ed87b6519405fd4505cf 100644
--- a/logging_utils.py
+++ b/logging_utils.py
@@ -14,7 +14,7 @@ import random
 import sys
 from logging.config import fileConfig
 from logging.handlers import RotatingFileHandler, SysLogHandler
-from typing import Any, Callable, Dict, Iterable, List, Mapping, Optional
+from typing import Any, Callable, Dict, Iterable, List, Optional
 
 import pytz
 from overrides import overrides
@@ -175,8 +175,8 @@ cfg.add_argument(
     ),
 )
 
-built_in_print = print
-logging_initialized = False
+BUILT_IN_PRINT = print
+LOGGING_INITIALIZED = False
 
 # A map from logging_callsite_id -> count of logged messages.
@@ -390,7 +390,7 @@ class MillisecondAwareFormatter(logging.Formatter):
             s = ct.strftime(datefmt)
         else:
             t = ct.strftime("%Y-%m-%d %H:%M:%S")
-            s = "%s,%03d" % (t, record.msecs)
+            s = f"{t},{record.msecs:%03d}"
         return s
@@ -454,10 +454,10 @@ def log_about_logging(
 
 def initialize_logging(logger=None) -> logging.Logger:
-    global logging_initialized
-    if logging_initialized:
+    global LOGGING_INITIALIZED
+    if LOGGING_INITIALIZED:
         return logging.getLogger()
-    logging_initialized = True
+    LOGGING_INITIALIZED = True
 
     if logger is None:
         logger = logging.getLogger()
@@ -479,7 +479,7 @@ def initialize_logging(logger=None) -> logging.Logger:
     # Global default logging level (--logging_level)
     default_logging_level = getattr(logging, config.config['logging_level'].upper(), None)
     if not isinstance(default_logging_level, int):
-        raise ValueError('Invalid level: %s' % config.config['logging_level'])
+        raise ValueError(f'Invalid level: {config.config["logging_level"]}')
 
     if config.config['logging_format']:
         fmt = config.config['logging_format']
@@ -563,7 +563,6 @@ def initialize_logging(logger=None) -> logging.Logger:
         logger.propagate = False
 
     if config.config['logging_captures_prints']:
-        global built_in_print
         import builtins
 
         def print_and_also_log(*arg, **kwarg):
@@ -572,7 +571,7 @@ def initialize_logging(logger=None) -> logging.Logger:
                 logger.warning(*arg)
             else:
                 logger.info(*arg)
-            built_in_print(*arg, **kwarg)
+            BUILT_IN_PRINT(*arg, **kwarg)
 
         builtins.print = print_and_also_log
@@ -667,7 +666,7 @@ class OutputMultiplexer(object):
         self.h: Optional[List[Any]] = None
         if handles is not None:
-            self.h = [handle for handle in handles]
+            self.h = list(handles)
         else:
             if destination_bitv & OutputMultiplexer.Destination.FILEHANDLES:
                 raise ValueError("Handle argument is required if bitv & FILEHANDLES")
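The renames to BUILT_IN_PRINT / LOGGING_INITIALIZED follow PEP 8's UPPER_CASE convention for module-level globals; BUILT_IN_PRINT in particular must be captured at import time because initialize_logging later rebinds builtins.print. The capture-then-wrap idiom, reduced to its core as a sketch:

    import builtins

    BUILT_IN_PRINT = print  # capture the real print before rebinding it

    def print_and_also_log(*args, **kwargs):
        # ... hand the message to a logger here ...
        BUILT_IN_PRINT(*args, **kwargs)  # still reaches stdout, no recursion

    builtins.print = print_and_also_log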
diff --git a/logical_search.py b/logical_search.py
index 76c2f86264be3fc49960166fe7a1b702f90e6c4b..b55e68901501ad2e68a7f45df034866072c3f61b 100644
--- a/logical_search.py
+++ b/logical_search.py
@@ -1,5 +1,9 @@
 #!/usr/bin/env python3
 
+"""This is a module concerned with the creation of and searching of a
+corpus of documents.  The corpus is held in memory for fast
+searching."""
+
 from __future__ import annotations
 import enum
@@ -12,6 +16,7 @@
 class ParseError(Exception):
     """An error encountered while parsing a logical search expression."""
 
     def __init__(self, message: str):
+        super().__init__()
         self.message = message
diff --git a/math_utils.py b/math_utils.py
index 3953ae585d249123c17e82f4a829ad68cf442c0b..37fcec5f6c557cdf1a66d39b671fd8d9438ba29c 100644
--- a/math_utils.py
+++ b/math_utils.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 
+"""Mathematical helpers."""
+
 import functools
 import math
 from heapq import heappop, heappush
@@ -76,8 +78,8 @@ def truncate_float(n: float, decimals: int = 2):
     3.141
     """
-    assert decimals > 0 and decimals < 10
-    multiplier = 10 ** decimals
+    assert 0 < decimals < 10
+    multiplier = 10**decimals
     return int(n * multiplier) / multiplier
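The new assert uses Python's chained comparison, which reads like the mathematical 0 < decimals < 10 and mentions decimals only once. The truncation arithmetic, worked through with decimals=3 (the function truncates rather than rounds):

    decimals = 3
    assert (decimals > 0 and decimals < 10) == (0 < decimals < 10)

    multiplier = 10**decimals                                # 1000
    assert int(3.14159 * multiplier) / multiplier == 3.141   # truncated, not rounded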
diff --git a/misc_utils.py b/misc_utils.py
index 4979a3c65bcb377b813b18868962297f80b0bd1d..a73728a28031d48703187ff3a86274ec05ab2950 100644
--- a/misc_utils.py
+++ b/misc_utils.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 
+"""Miscellaneous utilities."""
+
 import os
diff --git a/parallelize.py b/parallelize.py
index f2cfcbb144fbbff5620b4fea081b1493c8cabdcd..b2a1cedb988d98d78cf7654e3f65d4dfaa8beff6 100644
--- a/parallelize.py
+++ b/parallelize.py
@@ -10,6 +10,8 @@ from enum import Enum
 
 class Method(Enum):
+    """How should we parallelize; by threads, processes or remote workers?"""
+
     THREAD = 1
     PROCESS = 2
     REMOTE = 3
diff --git a/persistent.py b/persistent.py
index 119931b8ccba607ccc48321ac6f3d6dd3dd5b791..c902313eb4a28cb4635779f584f8775a2b646d35 100644
--- a/persistent.py
+++ b/persistent.py
@@ -1,5 +1,9 @@
 #!/usr/bin/env python3
 
+"""A Persistent is just a class with a load and save method.  This
+module defines the Persistent base and a decorator that can be used to
+create a persistent singleton that autoloads and autosaves."""
+
 import atexit
 import datetime
 import enum
@@ -136,21 +140,21 @@ class persistent_autoloaded_singleton(object):
             # memory.
             if self.instance is not None:
                 logger.debug(
-                    f'Returning already instantiated singleton instance of {cls.__name__}.'
+                    'Returning already instantiated singleton instance of %s.', cls.__name__
                 )
                 return self.instance
 
             # Otherwise, try to load it from persisted state.
             was_loaded = False
-            logger.debug(f'Attempting to load {cls.__name__} from persisted state.')
+            logger.debug('Attempting to load %s from persisted state.', cls.__name__)
             self.instance = cls.load()
             if not self.instance:
                 msg = 'Loading from cache failed.'
                 logger.warning(msg)
-                logger.debug(f'Attempting to instantiate {cls.__name__} directly.')
+                logger.debug('Attempting to instantiate %s directly.', cls.__name__)
                 self.instance = cls(*args, **kwargs)
             else:
-                logger.debug(f'Class {cls.__name__} was loaded from persisted state successfully.')
+                logger.debug('Class %s was loaded from persisted state successfully.', cls.__name__)
                 was_loaded = True
 
             assert self.instance is not None
diff --git a/profanity_filter.py b/profanity_filter.py
index e5c9e11b59a9f45b0aed4288a61b9fed09ca34ee..37756bac99abdaaa298b92ab7ff4f984ec844d51 100755
--- a/profanity_filter.py
+++ b/profanity_filter.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 
+"""A helper to identify and optionally obscure some bad words."""
+
 import logging
 import random
 import re
@@ -17,6 +19,8 @@ logger = logging.getLogger(__name__)
 
 @decorator_utils.singleton
 class ProfanityFilter(object):
+    """A helper to identify and optionally obscure some bad words."""
+
     def __init__(self):
         self.bad_words = set(
             [
@@ -499,7 +503,8 @@ class ProfanityFilter(object):
         chunks = [self.stemmer.stem(word) for word in nltk.word_tokenize(result)]
         return ' '.join(chunks)
 
-    def tokenize(self, text: str):
+    @staticmethod
+    def tokenize(text: str):
         for x in nltk.word_tokenize(text):
             for y in re.split(r'\W+', x):
                 yield y
@@ -518,24 +523,24 @@ class ProfanityFilter(object):
         False
         """
-        words = [word for word in self.tokenize(text)]
+        words = list(self.tokenize(text))
         for word in words:
             if self.is_bad_word(word):
-                logger.debug(f'"{word}" is profanity')
+                logger.debug('"%s" is profanity', word)
                 return True
 
         if len(words) > 1:
             for bigram in string_utils.ngrams_presplit(words, 2):
                 bigram = ' '.join(bigram)
                 if self.is_bad_word(bigram):
-                    logger.debug(f'"{bigram}" is profanity')
+                    logger.debug('"%s" is profanity', bigram)
                     return True
 
         if len(words) > 2:
             for trigram in string_utils.ngrams_presplit(words, 3):
                 trigram = ' '.join(trigram)
                 if self.is_bad_word(trigram):
-                    logger.debug(f'"{trigram}" is profanity')
+                    logger.debug('"%s" is profanity', trigram)
                     return True
         return False
@@ -563,7 +568,7 @@ class ProfanityFilter(object):
                     break
             return out
 
-        words = [x for x in self.tokenize(text)]
+        words = list(self.tokenize(text))
         words.append('')
         words.append('')
         words.append('')
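tokenize() no longer touches self, so @staticmethod is the right marker: it documents the method's independence from instance state and lets it be called on the class itself. In miniature, with a throwaway class:

    class Tokenizer:
        @staticmethod
        def tokenize(text: str):
            # No instance state needed; callable as Tokenizer.tokenize(...).
            yield from text.split()

    assert list(Tokenizer.tokenize("a b")) == ["a", "b"]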
diff --git a/remote_worker.py b/remote_worker.py
index 82b80ea3d722090ab7254eb24eac5884a9520172..75dfe8e46cb3d34e28f44267129ff38020d23a7a 100755
--- a/remote_worker.py
+++ b/remote_worker.py
@@ -59,14 +59,12 @@ def watch_for_cancel(terminate_event: threading.Event) -> None:
         for ancestor in ancestors:
             name = ancestor.name()
             pid = ancestor.pid
-            logger.debug(f'Ancestor process {name} (pid={pid})')
+            logger.debug('Ancestor process %s (pid=%d)', name, pid)
             if 'ssh' in name.lower():
                 saw_sshd = True
                 break
         if not saw_sshd:
-            logger.error(
-                'Did not see sshd in our ancestors list?!  Committing suicide.'
-            )
+            logger.error('Did not see sshd in our ancestors list?!  Committing suicide.')
             os.system('pstree')
             os.kill(os.getpid(), signal.SIGTERM)
         time.sleep(5.0)
@@ -99,43 +97,43 @@ def main() -> None:
     if config.config['watch_for_cancel']:
         (thread, stop_thread) = watch_for_cancel()
 
-    logger.debug(f'Reading {in_file}.')
+    logger.debug('Reading %s.', in_file)
     try:
         with open(in_file, 'rb') as rb:
             serialized = rb.read()
     except Exception as e:
         logger.exception(e)
-        logger.critical(f'Problem reading {in_file}. Aborting.')
+        logger.critical('Problem reading %s. Aborting.', in_file)
         cleanup_and_exit(thread, stop_thread, 1)
 
-    logger.debug(f'Deserializing {in_file}.')
+    logger.debug('Deserializing %s', in_file)
     try:
         fun, args, kwargs = cloudpickle.loads(serialized)
     except Exception as e:
         logger.exception(e)
-        logger.critical(f'Problem deserializing {in_file}. Aborting.')
+        logger.critical('Problem deserializing %s. Aborting.', in_file)
         cleanup_and_exit(thread, stop_thread, 2)
 
     logger.debug('Invoking user code...')
     with Timer() as t:
         ret = fun(*args, **kwargs)
-    logger.debug(f'User code took {t():.1f}s')
+    logger.debug('User code took %.1fs', t())
 
     logger.debug('Serializing results')
     try:
         serialized = cloudpickle.dumps(ret)
     except Exception as e:
         logger.exception(e)
-        logger.critical(f'Could not serialize result ({type(ret)}). Aborting.')
+        logger.critical('Could not serialize result (%s). Aborting.', type(ret))
         cleanup_and_exit(thread, stop_thread, 3)
 
-    logger.debug(f'Writing {out_file}.')
+    logger.debug('Writing %s', out_file)
     try:
         with open(out_file, 'wb') as wb:
             wb.write(serialized)
     except Exception as e:
         logger.exception(e)
-        logger.critical(f'Error writing {out_file}. Aborting.')
+        logger.critical('Error writing %s. Aborting.', out_file)
         cleanup_and_exit(thread, stop_thread, 4)
     cleanup_and_exit(thread, stop_thread, 0)
diff --git a/site_config.py b/site_config.py
index fcf22a8d2cf20d4e6a6dd83690a51de08ce2f44d..7f6410d39356c1d0d8f910cfcece67eaf4cff29e 100644
--- a/site_config.py
+++ b/site_config.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 
+"""Location/site dependent data."""
+
 import logging
 import platform
 from dataclasses import dataclass
@@ -27,6 +29,8 @@ args.add_argument(
 
 @dataclass
 class SiteConfig(object):
+    """The set of information specific to where the program is running."""
+
     location_name: str
     location: Location
     network: str
@@ -129,7 +133,7 @@ def effective_location(location_override: Optional[str] = None) -> str:
     if location_override is None or location_override == 'NONE':
         location = this_location()
     else:
-        logger.debug(f'site_config\'s location_override was set to: {location_override}')
+        logger.debug('site_config\'s location_override was set to: %s', location_override)
         location = location_override
     return location
diff --git a/smart_future.py b/smart_future.py
index 460dcb95862a9a88ecafde45fa8886dbcbb9eaa1..9aa68f38a5396953636e257032542f9d07533225 100644
--- a/smart_future.py
+++ b/smart_future.py
@@ -1,11 +1,15 @@
 #!/usr/bin/env python3
 
+"""A future that can be treated like the result that it contains and
+will not block until it is used.  At that point, if the underlying
+value is not yet available, it will block until it becomes
+available."""
+
 from __future__ import annotations
 import concurrent
 import concurrent.futures as fut
 import logging
-import traceback
 from typing import Callable, List, Set, TypeVar
 
 from overrides import overrides
@@ -31,7 +35,7 @@ def wait_any(
     smart_future_by_real_future = {}
     completed_futures: Set[fut.Future] = set()
     for x in futures:
-        assert type(x) == SmartFuture
+        assert isinstance(x, SmartFuture)
         real_futures.append(x.wrapped_future)
         smart_future_by_real_future[x.wrapped_future] = x
@@ -44,15 +48,12 @@ def wait_any(
             if log_exceptions and not f.cancelled():
                 exception = f.exception()
                 if exception is not None:
-                    logger.warning(
-                        f'Future {id(f)} raised an unhandled exception and exited.'
-                    )
+                    logger.warning('Future 0x%x raised an unhandled exception and exited.', id(f))
                     logger.exception(exception)
                     raise exception
             yield smart_future_by_real_future[f]
     if callback is not None:
         callback()
-    return
 
 def wait_all(
@@ -62,7 +63,7 @@ def wait_all(
 ) -> None:
     real_futures = []
     for x in futures:
-        assert type(x) == SmartFuture
+        assert isinstance(x, SmartFuture)
         real_futures.append(x.wrapped_future)
 
     (done, not_done) = concurrent.futures.wait(
@@ -73,9 +74,7 @@ def wait_all(
         if not f.cancelled():
             exception = f.exception()
             if exception is not None:
-                logger.warning(
-                    f'Future {id(f)} raised an unhandled exception and exited.'
-                )
+                logger.warning('Future 0x%x raised an unhandled exception and exited.', id(f))
                 logger.exception(exception)
                 raise exception
     assert len(done) == len(real_futures)
@@ -91,7 +90,7 @@ class SmartFuture(DeferredOperand):
     """
 
     def __init__(self, wrapped_future: fut.Future) -> None:
-        assert type(wrapped_future) == fut.Future
+        assert isinstance(wrapped_future, fut.Future)
         self.wrapped_future = wrapped_future
         self.id = id_generator.get("smart_future_id")
@@ -104,5 +103,5 @@ class SmartFuture(DeferredOperand):
     # You shouldn't have to call this; instead, have a look at defining a
     # method on DeferredOperand base class.
     @overrides
-    def _resolve(self, *, timeout=None) -> T:
+    def _resolve(self, timeout=None) -> T:
         return self.wrapped_future.result(timeout)
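The assert changes in this file are the standard isinstance fix: type(x) == SmartFuture rejects subclasses, while isinstance accepts them (this is what pylint's unidiomatic-typecheck warning suggests). Demonstrated with throwaway classes:

    class Base:
        pass

    class Derived(Base):
        pass

    d = Derived()
    assert type(d) != Base       # exact-type comparison fails for a subclass
    assert isinstance(d, Base)   # isinstance respects inheritance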
diff --git a/state_tracker.py b/state_tracker.py
index e59231560e900305eaadab380746e5b671062242..b375f8928dc09c6f359d6e99846d06f1db947c5e 100644
--- a/state_tracker.py
+++ b/state_tracker.py
@@ -1,5 +1,10 @@
 #!/usr/bin/env python3
 
+"""Several helpers to keep track of internal state via periodic
+polling.  StateTracker expects to be invoked periodically to maintain
+state whereas the others automatically update themselves and,
+optionally, expose an event for client code to wait on state changes."""
+
 import datetime
 import logging
 import threading
@@ -35,6 +40,7 @@ class StateTracker(ABC):
         """
         self.update_ids_to_update_secs = update_ids_to_update_secs
         self.last_reminder_ts: Dict[str, Optional[datetime.datetime]] = {}
+        self.now: Optional[datetime.datetime] = None
         for x in update_ids_to_update_secs.keys():
             self.last_reminder_ts[x] = None
@@ -80,13 +86,13 @@ class StateTracker(ABC):
             refresh_secs = self.update_ids_to_update_secs[update_id]
             last_run = self.last_reminder_ts[update_id]
             if last_run is None:  # Never run before
-                logger.debug(f'id {update_id} has never been run; running it now')
+                logger.debug('id %s has never been run; running it now', update_id)
                 self.update(update_id, self.now, self.last_reminder_ts[update_id])
                 self.last_reminder_ts[update_id] = self.now
             else:
                 delta = self.now - last_run
                 if delta.total_seconds() >= refresh_secs:  # Is overdue?
-                    logger.debug(f'id {update_id} is overdue; running it now')
+                    logger.debug('id %s is overdue; running it now', update_id)
                     self.update(
                         update_id,
                         self.now,
@@ -114,7 +120,7 @@ class AutomaticStateTracker(StateTracker):
                 logger.debug('pace_maker noticed event; shutting down')
                 return
             self.heartbeat()
-            logger.debug(f'pace_maker is sleeping for {self.sleep_delay}s')
+            logger.debug('pace_maker is sleeping for %.1fs', self.sleep_delay)
             time.sleep(self.sleep_delay)
 
     def __init__(
@@ -127,12 +133,12 @@ class AutomaticStateTracker(StateTracker):
         super().__init__(update_ids_to_update_secs)
         if override_sleep_delay is not None:
-            logger.debug(f'Overriding sleep delay to {override_sleep_delay}')
+            logger.debug('Overriding sleep delay to %.1f', override_sleep_delay)
             self.sleep_delay = override_sleep_delay
         else:
             periods_list = list(update_ids_to_update_secs.values())
             self.sleep_delay = math_utils.gcd_float_sequence(periods_list)
-            logger.info(f'Computed sleep_delay={self.sleep_delay}')
+            logger.info('Computed sleep_delay=%.1f', self.sleep_delay)
         (thread, stop_event) = self.pace_maker()
         self.should_terminate = stop_event
         self.updater_thread = thread
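On the sleep_delay computed in the else branch above: sleeping the GCD of all update periods lets a single heartbeat cadence service every update id on schedule. math_utils.gcd_float_sequence is the repo's helper; the Fraction-based version below is only an illustration of the idea:

    from fractions import Fraction
    from functools import reduce
    from math import gcd

    def gcd_float_sketch(periods):
        # Rational gcd: gcd of the numerators over the lcm of the denominators.
        fracs = [Fraction(p).limit_denominator() for p in periods]
        num = reduce(gcd, (f.numerator for f in fracs))
        den = reduce(lambda a, b: a * b // gcd(a, b), (f.denominator for f in fracs))
        return float(Fraction(num, den))

    # Update ids firing every 10s, 15s and 25s share a 5s heartbeat.
    assert gcd_float_sketch([10.0, 15.0, 25.0]) == 5.0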
diff --git a/stopwatch.py b/stopwatch.py
index c6c154c124482c9bf9c9e20950a9cca0fb22cb1d..fa4f2b52f54998bb029f7e14433e5451abd67812 100644
--- a/stopwatch.py
+++ b/stopwatch.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 
+"""A simple stopwatch decorator / context for timing things."""
+
 import time
 from typing import Callable, Optional
diff --git a/string_utils.py b/string_utils.py
index 3c97ff7991726012ff091dc7aa042abb88000bf6..d75c6ba1aca2c559ed4254d535747c54f4719bf5 100644
--- a/string_utils.py
+++ b/string_utils.py
@@ -1091,7 +1091,6 @@ def valid_date(in_str: str) -> bool:
     """
     True if the string represents a valid date.
     """
-    import dateparse
     import dateparse.dateparse_utils as dp
 
     try:
@@ -1113,7 +1112,7 @@ def to_datetime(in_str: str) -> Optional[datetime.datetime]:
     try:
         d = dp.DateParser()  # type: ignore
         dt = d.parse(in_str)
-        if type(dt) == datetime.datetime:
+        if isinstance(dt, datetime.datetime):
             return dt
     except ValueError:
         msg = f'Unable to parse datetime {in_str}.'
@@ -1372,7 +1371,7 @@ def make_contractions(txt: str) -> str:
             for second in second_list:
                 # Disallow there're/where're.  They're valid English
                 # but sound weird.
-                if (first == 'there' or first == 'where') and second == 'a(re)':
+                if (first in ('there', 'where')) and second == 'a(re)':
                     continue
 
                 pattern = fr'\b({first})\s+{second}\b'
@@ -1458,11 +1457,11 @@ def shuffle_columns_into_list(
     # Column specs map input lines' columns into outputs.
     # [col1, col2...]
     for spec in column_specs:
-        chunk = ''
+        hunk = ''
         for n in spec:
-            chunk = chunk + delim + input_lines[n]
-        chunk = chunk.strip(delim)
-        out.append(chunk)
+            hunk = hunk + delim + input_lines[n]
+        hunk = hunk.strip(delim)
+        out.append(hunk)
     return out
@@ -1488,11 +1487,11 @@ def shuffle_columns_into_dict(
     # Column specs map input lines' columns into outputs.
     # "key", [col1, col2...]
     for spec in column_specs:
-        chunk = ''
+        hunk = ''
         for n in spec[1]:
-            chunk = chunk + delim + input_lines[n]
-        chunk = chunk.strip(delim)
-        out[spec[0]] = chunk
+            hunk = hunk + delim + input_lines[n]
+        hunk = hunk.strip(delim)
+        out[spec[0]] = hunk
     return out
@@ -1517,9 +1516,9 @@ def to_ascii(x: str):
     b'1, 2, 3'
     """
-    if type(x) is str:
+    if isinstance(x, str):
         return x.encode('ascii')
-    if type(x) is bytes:
+    if isinstance(x, bytes):
         return x
     raise Exception('to_ascii works with strings and bytes')
diff --git a/text_utils.py b/text_utils.py
index 76cc7e816db9ae87581989bc314fd7d07d4ca154..4384a1e6134810982e9227d2bb1dfdb517627f72 100644
--- a/text_utils.py
+++ b/text_utils.py
@@ -15,6 +15,8 @@ logger = logging.getLogger(__file__)
 
 class RowsColumns(NamedTuple):
+    """Row + Column"""
+
     rows: int
     columns: int
@@ -31,7 +33,7 @@ def get_console_rows_columns() -> RowsColumns:
         ).split()
     except Exception as e:
         logger.exception(e)
-        raise Exception('Can\'t determine console size?!')
+        raise Exception('Can\'t determine console size?!') from e
     return RowsColumns(int(rows), int(columns))
@@ -122,10 +124,10 @@ def sparkline(numbers: List[float]) -> Tuple[float, float, str]:
     barcount = len(_bar)
     min_num, max_num = min(numbers), max(numbers)
     span = max_num - min_num
-    sparkline = ''.join(
+    sline = ''.join(
         _bar[min([barcount - 1, int((n - min_num) / span * barcount)])] for n in numbers
     )
-    return min_num, max_num, sparkline
+    return min_num, max_num, sline
 
 def distribute_strings(
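The `from e` appended above makes the exception chain explicit: the re-raised exception carries the original as __cause__, and the traceback reads "The above exception was the direct cause of..." instead of "During handling..., another exception occurred". A minimal sketch with a hypothetical helper:

    def read_config(path: str) -> str:
        try:
            with open(path) as f:
                return f.read()
        except OSError as e:
            raise RuntimeError(f"Can't load config from {path}") from e

    try:
        read_config('/nonexistent/path')
    except RuntimeError as err:
        assert isinstance(err.__cause__, OSError)   # original error preserved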
diff --git a/thread_utils.py b/thread_utils.py
index 22161275605d76a1199df8f18d536fd04e2fe17b..4db4cf68b4ef916f323f90bae492d1c59dca361f 100644
--- a/thread_utils.py
+++ b/thread_utils.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 
+"""Utilities for dealing with threads + threading."""
+
 import functools
 import logging
 import os
@@ -104,7 +106,7 @@ def background_thread(
                 kwargs=kwa,
             )
             thread.start()
-            logger.debug(f'Started thread {thread.name} tid={thread.ident}')
+            logger.debug('Started thread "%s" tid=%d', thread.name, thread.ident)
             return (thread, should_terminate)
         return inner_wrapper
@@ -163,7 +165,7 @@ def periodically_invoke(
             newargs = (should_terminate, *args)
             thread = threading.Thread(target=helper_thread, args=newargs, kwargs=kwargs)
             thread.start()
-            logger.debug(f'Started thread {thread.name} tid={thread.ident}')
+            logger.debug('Started thread "%s" tid=%d', thread.name, thread.ident)
             return (thread, should_terminate)
         return wrapper_repeat
diff --git a/type_utils.py b/type_utils.py
index 1584597c039bc6a78900f28e3182ed64e601059d..c2f432a2306fee2a828eaf8b9d0de41c224d3380 100644
--- a/type_utils.py
+++ b/type_utils.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 
+"""Utility functions for dealing with typing."""
+
 import logging
 from typing import Any, Optional
diff --git a/unittest_utils.py b/unittest_utils.py
index f229df75e8b88825d66ca227d7e907d3dc725e1a..70e588e2fa8025b2a70941b9837c78fb3f65421c 100644
--- a/unittest_utils.py
+++ b/unittest_utils.py
@@ -76,6 +76,9 @@ unittest.main = bootstrap.initialize(unittest.main)
 
 class PerfRegressionDataPersister(ABC):
+    """A base class for a signature dealing with persisting perf
+    regression data."""
+
     def __init__(self):
         pass
@@ -93,7 +96,10 @@ class PerfRegressionDataPersister(ABC):
 
 class FileBasedPerfRegressionDataPersister(PerfRegressionDataPersister):
+    """A perf regression data persister that uses files."""
+
     def __init__(self, filename: str):
+        super().__init__()
         self.filename = filename
         self.traces_to_delete: List[str] = []
@@ -114,7 +120,10 @@ class FileBasedPerfRegressionDataPersister(PerfRegressionDataPersister):
 
 class DatabasePerfRegressionDataPersister(PerfRegressionDataPersister):
+    """A perf regression data persister that uses a database backend."""
+
     def __init__(self, dbspec: str):
+        super().__init__()
         self.dbspec = dbspec
         self.engine = sa.create_engine(self.dbspec)
         self.conn = self.engine.connect()
@@ -131,10 +140,10 @@ class DatabasePerfRegressionDataPersister(PerfRegressionDataPersister):
     def save_performance_data(self, method_id: str, data: Dict[str, List[float]]):
         self.delete_performance_data(method_id)
-        for (method_id, perf_data) in data.items():
+        for (mid, perf_data) in data.items():
             sql = 'INSERT INTO runtimes_by_function (function, runtime) VALUES '
             for perf in perf_data:
-                self.conn.execute(sql + f'("{method_id}", {perf});')
+                self.conn.execute(sql + f'("{mid}", {perf});')
 
     def delete_performance_data(self, method_id: str):
         sql = f'DELETE FROM runtimes_by_function WHERE function = "{method_id}"'
@@ -168,8 +177,8 @@ def check_method_for_perf_regressions(func: Callable) -> Callable:
         func_id = function_utils.function_identifier(func)
         func_name = func.__name__
-        logger.debug(f'Watching {func_name}\'s performance...')
-        logger.debug(f'Canonical function identifier = {func_id}')
+        logger.debug('Watching %s\'s performance...', func_name)
+        logger.debug('Canonical function identifier = "%s"', func_id)
 
         try:
             perfdb = helper.load_performance_data(func_id)
@@ -195,15 +204,15 @@ def check_method_for_perf_regressions(func: Callable) -> Callable:
         hist = perfdb.get(func_id, [])
         if len(hist) < config.config['unittests_num_perf_samples']:
             hist.append(run_time)
-            logger.debug(f'Still establishing a perf baseline for {func_name}')
+            logger.debug('Still establishing a perf baseline for %s', func_name)
         else:
             stdev = statistics.stdev(hist)
-            logger.debug(f'For {func_name}, performance stdev={stdev}')
+            logger.debug('For %s, performance stdev=%.2f', func_name, stdev)
             slowest = hist[-1]
-            logger.debug(f'For {func_name}, slowest perf on record is {slowest:f}s')
+            logger.debug('For %s, slowest perf on record is %.2fs', func_name, slowest)
             limit = slowest + stdev * 4
-            logger.debug(f'For {func_name}, max acceptable runtime is {limit:f}s')
-            logger.debug(f'For {func_name}, actual observed runtime was {run_time:f}s')
+            logger.debug('For %s, max acceptable runtime is %.2fs', func_name, limit)
+            logger.debug('For %s, actual observed runtime was %.2fs', func_name, run_time)
             if run_time > limit:
                 msg = f'''{func_id} performance has regressed unacceptably.
{slowest:f}s is the slowest runtime on record in {len(hist)} perf samples.
@@ -250,7 +259,7 @@ def check_all_methods_for_perf_regressions(prefix='test_'):
         for name, m in inspect.getmembers(cls, inspect.isfunction):
             if name.startswith(prefix):
                 setattr(cls, name, check_method_for_perf_regressions(m))
-                logger.debug(f'Wrapping {cls.__name__}:{name}.')
+                logger.debug('Wrapping %s:%s.', cls.__name__, name)
         return cls
 
     return decorate_the_testcase
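The thresholding these debug lines report on: a test is flagged when its runtime exceeds the slowest recorded sample plus four standard deviations. Worked through numerically with invented samples:

    import statistics

    hist = [1.00, 1.05, 0.98, 1.10]    # prior runtimes in seconds (invented)
    stdev = statistics.stdev(hist)     # ~0.054s
    slowest = hist[-1]                 # the entry the wrapper treats as slowest
    limit = slowest + stdev * 4        # ~1.32s
    run_time = 1.2
    assert run_time <= limit           # within tolerance; no regression flagged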
diff --git a/unscrambler.py b/unscrambler.py
index c5bc9b5f15200c0f909af2bd5f849be6fa60b809..1b242309b649eaa036277fdb22fc6f9c7705f0c8 100644
--- a/unscrambler.py
+++ b/unscrambler.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 
+"""A fast word unscrambler library."""
+
 import logging
 from typing import Dict, Mapping, Optional
@@ -21,10 +23,10 @@ cfg.add_argument(
 logger = logging.getLogger(__name__)
 
 letters_bits = 32
-letters_mask = 2 ** letters_bits - 1
+letters_mask = 2**letters_bits - 1
 
 fprint_bits = 52
-fprint_mask = (2 ** fprint_bits - 1) << letters_bits
+fprint_mask = (2**fprint_bits - 1) << letters_bits
 
 fprint_feature_bit = {
     'e': 0,
@@ -106,7 +108,7 @@ class Unscrambler(object):
         self.sigs = []
         self.words = []
 
-        filename = self.get_indexfile(indexfile)
+        filename = Unscrambler.get_indexfile(indexfile)
         with open(filename, 'r') as rf:
             lines = rf.readlines()
         for line in lines:
@@ -116,7 +118,8 @@ class Unscrambler(object):
             self.sigs.append(isig)
             self.words.append(word)
 
-    def get_indexfile(self, indexfile: Optional[str]) -> str:
+    @staticmethod
+    def get_indexfile(indexfile: Optional[str]) -> str:
         if indexfile is None:
             if 'unscrambler_default_indexfile' in config.config:
                 indexfile = config.config['unscramble_indexfile']
@@ -193,7 +196,6 @@ class Unscrambler(object):
     @staticmethod
     def repopulate(
-        lsigs: Dict[str, int],
         dictfile: str = '/usr/share/dict/words',
         indexfile: str = '/usr/share/dict/sparse_index',
     ) -> None:
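On the masks reformatted above: the unscrambler packs a 52-bit feature fingerprint above a 32-bit letter field in one integer, so letters_mask selects the low 32 bits and fprint_mask the 52 bits above them. Checked concretely (sig is a made-up packed value):

    letters_bits = 32
    letters_mask = 2**letters_bits - 1                    # low 32 bits
    fprint_bits = 52
    fprint_mask = (2**fprint_bits - 1) << letters_bits    # 52 bits above them

    sig = (0xABCDE << letters_bits) | 0x1234
    assert sig & letters_mask == 0x1234
    assert (sig & fprint_mask) >> letters_bits == 0xABCDE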