From 8cb9d197df0c5bed18974bd17ac68788d34d6986 Mon Sep 17 00:00:00 2001 From: Saran Ahluwalia Date: Fri, 3 Dec 2021 13:33:19 -0500 Subject: [PATCH] updated doe energy link and changed fieldnames - removed computation step as BURDEN is already a ratio (#963) Co-authored-by: Saran Ahluwalia --- .../etl/sources/doe_energy_burden/etl.py | 11 +++-------- 1 file changed, 3 insertions(+), 8 deletions(-) diff --git a/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py b/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py index e764e997..358061ce 100644 --- a/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py +++ b/data/data-pipeline/data_pipeline/etl/sources/doe_energy_burden/etl.py @@ -12,15 +12,15 @@ class DOEEnergyBurden(ExtractTransformLoad): def __init__(self): self.DOE_FILE_URL = ( settings.AWS_JUSTICE40_DATASOURCES_URL - + "/DOE_LEAD_with_EJSCREEN.csv.zip" + + "/DOE_LEAD_AMI_TRACT_2018_ALL.csv.zip" ) self.OUTPUT_PATH: Path = ( self.DATA_PATH / "dataset" / "doe_energy_burden" ) - self.TRACT_INPUT_COLUMN_NAME = "GEOID" - self.ENERGY_BURDEN_FIELD_NAME = "Energy burden" + self.TRACT_INPUT_COLUMN_NAME = "FIP" + self.ENERGY_BURDEN_FIELD_NAME = "BURDEN" # Constants for output self.COLUMNS_TO_KEEP = [ @@ -61,11 +61,6 @@ class DOEEnergyBurden(ExtractTransformLoad): } ) - # Convert energy burden to a fraction, since we represent all other percentages as fractions. - output_df[self.ENERGY_BURDEN_FIELD_NAME] = ( - output_df[self.ENERGY_BURDEN_FIELD_NAME] / 100 - ) - # Left-pad the tracts with 0s expected_length_of_census_tract_field = 11 output_df[self.GEOID_TRACT_FIELD_NAME] = (