DoE LEAD References Need to be Updated (#976)

* replace temporary fieldnames that are not found and indexed

* fixed field names

* PR review

* PR review - revert

Co-authored-by: Saran Ahluwalia <sarahluw@cisco.com>
This commit is contained in:
Saran Ahluwalia 2021-12-04 12:38:50 -05:00 committed by GitHub
parent c5dff6e5f7
commit 19efdfeb4a
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@ -43,7 +43,7 @@ class DOEEnergyBurden(ExtractTransformLoad):
self.raw_df = pd.read_csv(
filepath_or_buffer=self.TMP_PATH
/ "doe_energy_burden"
/ "DOE_LEAD_with_EJSCREEN.csv",
/ "DOE_LEAD_AMI_TRACT_2018_ALL.csv",
# The following need to remain as strings for all of their digits, not get converted to numbers.
dtype={
self.TRACT_INPUT_COLUMN_NAME: "string",
@ -56,7 +56,7 @@ class DOEEnergyBurden(ExtractTransformLoad):
output_df = self.raw_df.rename(
columns={
"AvgEnergyBurden": self.ENERGY_BURDEN_FIELD_NAME,
"BURDEN": self.ENERGY_BURDEN_FIELD_NAME,
self.TRACT_INPUT_COLUMN_NAME: self.GEOID_TRACT_FIELD_NAME,
}
)
@ -78,7 +78,7 @@ class DOEEnergyBurden(ExtractTransformLoad):
def load(self) -> None:
logger.info("Saving DOE Energy Burden CSV")
self.OUTPUT_PATH.mkdir(parents=True, exist_ok=True)
self.output_df[self.COLUMNS_TO_KEEP].to_csv(
path_or_buf=self.OUTPUT_PATH / "usa.csv", index=False