X-Git-Url: https://wannabe.guru.org/gitweb/?a=blobdiff_plain;f=ml%2Fmodel_trainer.py;h=acd721868a2a9e04de0da364b8d37dcc268b4fee;hb=5f75cf834725ac26b289cc5f157af0cb71cd5f0e;hp=f9e132e18aa20ecf2461db55257b6037a0c13a4e;hpb=bef486c8c06e8d743a98b89910658a615acc8bbc;p=python_utils.git diff --git a/ml/model_trainer.py b/ml/model_trainer.py index f9e132e..acd7218 100644 --- a/ml/model_trainer.py +++ b/ml/model_trainer.py @@ -246,12 +246,12 @@ class TrainingBlueprint(ABC): y.pop() if self.spec.delete_bad_inputs: - msg = f"WARNING: {filename}: missing features or label. DELETING." + msg = f"WARNING: {filename}: missing features or label; expected {self.spec.feature_count} but saw {len(x)}. DELETING." print(msg, file=sys.stderr) logger.warning(msg) os.remove(filename) else: - msg = f"WARNING: {filename}: missing features or label. Skipped." + msg = f"WARNING: {filename}: missing features or label; expected {self.spec.feature_count} but saw {len(x)}. Skipping." print(msg, file=sys.stderr) logger.warning(msg) return (X, y) @@ -356,6 +356,13 @@ class TrainingBlueprint(ABC): import input_utils import string_utils + now: datetime.datetime = datetime_utils.now_pacific() + info = f"""Timestamp: {datetime_utils.datetime_to_string(now)} +Model params: {params} +Training examples: {num_examples} +Training set score: {training_score:.2f}% +Testing set score: {test_score:.2f}%""" + print(f'\n{info}\n') if ( (self.spec.persist_percentage_threshold is not None and test_score > self.spec.persist_percentage_threshold) @@ -376,12 +383,6 @@ class TrainingBlueprint(ABC): print(msg) logger.info(msg) model_info_filename = f"{self.spec.basename}_model_info.txt" - now: datetime.datetime = datetime_utils.now_pacific() - info = f"""Timestamp: {datetime_utils.datetime_to_string(now)} -Model params: {params} -Training examples: {num_examples} -Training set score: {training_score:.2f}% -Testing set score: {test_score:.2f}%""" with open(model_info_filename, "w") as f: f.write(info) msg = f"Wrote {model_info_filename}:"