From 19efdfeb4ad348ba10bb17c5796bf4c7546ba466 Mon Sep 17 00:00:00 2001 From: Saran Ahluwalia Date: Sat, 4 Dec 2021 12:38:50 -0500 Subject: [PATCH] DoE LEAD References Need to be Updated (#976) * replace temporary fieldnames that are not found and indexed * fixed field names * PR review * PR review - revert Co-authored-by: Saran Ahluwalia --- .../data_pipeline/etl/sources/doe_energy_burden/etl.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py b/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py index 358061ce..7889d2f6 100644 --- a/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py +++ b/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py @@ -43,7 +43,7 @@ class DOEEnergyBurden(ExtractTransformLoad): self.raw_df = pd.read_csv( filepath_or_buffer=self.TMP_PATH / "doe_energy_burden" - / "DOE_LEAD_with_EJSCREEN.csv", + / "DOE_LEAD_AMI_TRACT_2018_ALL.csv", # The following need to remain as strings for all of their digits, not get converted to numbers. dtype={ self.TRACT_INPUT_COLUMN_NAME: "string", @@ -56,7 +56,7 @@ class DOEEnergyBurden(ExtractTransformLoad): output_df = self.raw_df.rename( columns={ - "AvgEnergyBurden": self.ENERGY_BURDEN_FIELD_NAME, + "BURDEN": self.ENERGY_BURDEN_FIELD_NAME, self.TRACT_INPUT_COLUMN_NAME: self.GEOID_TRACT_FIELD_NAME, } ) @@ -78,7 +78,7 @@ class DOEEnergyBurden(ExtractTransformLoad): def load(self) -> None: logger.info("Saving DOE Energy Burden CSV") - + self.OUTPUT_PATH.mkdir(parents=True, exist_ok=True) self.output_df[self.COLUMNS_TO_KEEP].to_csv( path_or_buf=self.OUTPUT_PATH / "usa.csv", index=False