Updated DOE energy link and changed field names - removed the computation step, as BURDEN is already a ratio (#963)

Co-authored-by: Saran Ahluwalia <sarahluw@cisco.com>
This commit is contained in:
Saran Ahluwalia 2021-12-03 13:33:19 -05:00 committed by GitHub
commit 8cb9d197df
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@ -12,15 +12,15 @@ class DOEEnergyBurden(ExtractTransformLoad):
def __init__(self):
self.DOE_FILE_URL = (
settings.AWS_JUSTICE40_DATASOURCES_URL
+ "/DOE_LEAD_with_EJSCREEN.csv.zip"
+ "/DOE_LEAD_AMI_TRACT_2018_ALL.csv.zip"
)
self.OUTPUT_PATH: Path = (
self.DATA_PATH / "dataset" / "doe_energy_burden"
)
self.TRACT_INPUT_COLUMN_NAME = "GEOID"
self.ENERGY_BURDEN_FIELD_NAME = "Energy burden"
self.TRACT_INPUT_COLUMN_NAME = "FIP"
self.ENERGY_BURDEN_FIELD_NAME = "BURDEN"
# Constants for output
self.COLUMNS_TO_KEEP = [
@ -61,11 +61,6 @@ class DOEEnergyBurden(ExtractTransformLoad):
}
)
# Convert energy burden to a fraction, since we represent all other percentages as fractions.
output_df[self.ENERGY_BURDEN_FIELD_NAME] = (
output_df[self.ENERGY_BURDEN_FIELD_NAME] / 100
)
# Left-pad the tracts with 0s
expected_length_of_census_tract_field = 11
output_df[self.GEOID_TRACT_FIELD_NAME] = (