mirror of
https://github.com/DOI-DO/j40-cejst-2.git
synced 2025-02-22 09:41:26 -08:00
Move Housing and Transportation Index to tracts (#903)
Update data download URL to use tract as focus, use tract field name, and move this dataset to the tracts df list in etl_score. Co-authored-by: Shelby Switzer <shelby.switzer@cms.hhs.gov>
This commit is contained in:
parent
776a52595f
commit
0c8b32e679
2 changed files with 7 additions and 7 deletions
|
@ -226,7 +226,6 @@ class ScoreETL(ExtractTransformLoad):
|
|||
census_block_group_dfs = [
|
||||
self.ejscreen_df,
|
||||
self.census_df,
|
||||
self.housing_and_transportation_df,
|
||||
self.census_acs_median_incomes_df,
|
||||
self.national_risk_index_df,
|
||||
]
|
||||
|
@ -241,6 +240,7 @@ class ScoreETL(ExtractTransformLoad):
|
|||
self.doe_energy_burden_df,
|
||||
self.geocorr_urban_rural_df,
|
||||
self.persistent_poverty_df,
|
||||
self.housing_and_transportation_df,
|
||||
]
|
||||
census_tract_df = self._join_tract_dfs(census_tract_dfs)
|
||||
|
||||
|
|
|
@ -11,7 +11,7 @@ logger = get_module_logger(__name__)
|
|||
class HousingTransportationETL(ExtractTransformLoad):
|
||||
def __init__(self):
|
||||
self.HOUSING_FTP_URL = (
|
||||
"https://htaindex.cnt.org/download/download.php?focus=blkgrp&geoid="
|
||||
"https://htaindex.cnt.org/download/download.php?focus=tract&geoid="
|
||||
)
|
||||
self.OUTPUT_PATH = (
|
||||
self.DATA_PATH / "dataset" / "housing_and_transportation_index"
|
||||
|
@ -33,7 +33,7 @@ class HousingTransportationETL(ExtractTransformLoad):
|
|||
|
||||
# New file name:
|
||||
tmp_csv_file_path = (
|
||||
zip_file_dir / f"htaindex_data_blkgrps_{fips}.csv"
|
||||
zip_file_dir / f"htaindex_data_tracts_{fips}.csv"
|
||||
)
|
||||
|
||||
try:
|
||||
|
@ -50,10 +50,10 @@ class HousingTransportationETL(ExtractTransformLoad):
|
|||
def transform(self) -> None:
|
||||
logger.info("Transforming Housing and Transportation Data")
|
||||
|
||||
# Rename and reformat block group ID
|
||||
self.df.rename(columns={"blkgrp": self.GEOID_FIELD_NAME}, inplace=True)
|
||||
self.df[self.GEOID_FIELD_NAME] = self.df[
|
||||
self.GEOID_FIELD_NAME
|
||||
# Rename and reformat tract ID
|
||||
self.df.rename(columns={"tract": self.GEOID_TRACT_FIELD_NAME}, inplace=True)
|
||||
self.df[self.GEOID_TRACT_FIELD_NAME] = self.df[
|
||||
self.GEOID_TRACT_FIELD_NAME
|
||||
].str.replace('"', "")
|
||||
|
||||
def load(self) -> None:
|
||||
|
|
Loading…
Add table
Reference in a new issue