From 3776e248da78916d08f7b085b3ab2649cd5ffd08 Mon Sep 17 00:00:00 2001 From: matt bowen Date: Wed, 10 Aug 2022 14:15:43 -0400 Subject: [PATCH] Update per code review (#1518) --- data/data-pipeline/data_pipeline/etl/score/config/datasets.yml | 2 +- .../data_pipeline/etl/sources/doe_energy_burden/etl.py | 3 ++- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/data/data-pipeline/data_pipeline/etl/score/config/datasets.yml b/data/data-pipeline/data_pipeline/etl/score/config/datasets.yml index 13b06aedc..5316fadde 100644 --- a/data/data-pipeline/data_pipeline/etl/score/config/datasets.yml +++ b/data/data-pipeline/data_pipeline/etl/score/config/datasets.yml @@ -117,7 +117,7 @@ datasets: field_type: float include_in_downloadable_files: true include_in_tiles: true - - long_name: "Exaple ETL" + - long_name: "Example ETL" short_name: "Example" module_name: "example_dataset" input_geoid_tract_field_name: "GEOID10_TRACT" diff --git a/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py b/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py index 0f67c4023..52e8d3f05 100644 --- a/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py +++ b/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py @@ -28,7 +28,7 @@ def __init__(self): self.output_df: pd.DataFrame def transform(self) -> None: - logger.info("Starting transforms.") + logger.info("Starting DOE Energy Burden transforms.") raw_df: pd.DataFrame = pd.read_csv( filepath_or_buffer=self.get_tmp_path() / "DOE_LEAD_AMI_TRACT_2018_ALL.csv", @@ -39,6 +39,7 @@ def transform(self) -> None: low_memory=False, ) + logger.info("Renaming columns and ensuring output format is correct") output_df = raw_df.rename( columns={ self.INPUT_ENERGY_BURDEN_FIELD_NAME: self.REVISED_ENERGY_BURDEN_FIELD_NAME,