diff --git a/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py b/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py index 358061ce..7889d2f6 100644 --- a/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py +++ b/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py @@ -43,7 +43,7 @@ class DOEEnergyBurden(ExtractTransformLoad): self.raw_df = pd.read_csv( filepath_or_buffer=self.TMP_PATH / "doe_energy_burden" - / "DOE_LEAD_with_EJSCREEN.csv", + / "DOE_LEAD_AMI_TRACT_2018_ALL.csv", # The following need to remain as strings for all of their digits, not get converted to numbers. dtype={ self.TRACT_INPUT_COLUMN_NAME: "string", @@ -56,7 +56,7 @@ class DOEEnergyBurden(ExtractTransformLoad): output_df = self.raw_df.rename( columns={ - "AvgEnergyBurden": self.ENERGY_BURDEN_FIELD_NAME, + "BURDEN": self.ENERGY_BURDEN_FIELD_NAME, self.TRACT_INPUT_COLUMN_NAME: self.GEOID_TRACT_FIELD_NAME, } ) @@ -78,7 +78,7 @@ class DOEEnergyBurden(ExtractTransformLoad): def load(self) -> None: logger.info("Saving DOE Energy Burden CSV") - + self.OUTPUT_PATH.mkdir(parents=True, exist_ok=True) self.output_df[self.COLUMNS_TO_KEEP].to_csv( path_or_buf=self.OUTPUT_PATH / "usa.csv", index=False