mirror of
https://github.com/DOI-DO/j40-cejst-2.git
synced 2025-02-23 18:14:19 -08:00
Move Housing and Transportation Index to tracts (#903)
Update the data download URL to use tract as the focus, use the tract field name, and move this dataset to the tracts df list in etl_score.

Co-authored-by: Shelby Switzer <shelby.switzer@cms.hhs.gov>
This commit is contained in:
parent
776a52595f
commit
0c8b32e679
2 changed files with 7 additions and 7 deletions
|
@ -226,7 +226,6 @@ class ScoreETL(ExtractTransformLoad):
|
||||||
census_block_group_dfs = [
|
census_block_group_dfs = [
|
||||||
self.ejscreen_df,
|
self.ejscreen_df,
|
||||||
self.census_df,
|
self.census_df,
|
||||||
self.housing_and_transportation_df,
|
|
||||||
self.census_acs_median_incomes_df,
|
self.census_acs_median_incomes_df,
|
||||||
self.national_risk_index_df,
|
self.national_risk_index_df,
|
||||||
]
|
]
|
||||||
|
@ -241,6 +240,7 @@ class ScoreETL(ExtractTransformLoad):
|
||||||
self.doe_energy_burden_df,
|
self.doe_energy_burden_df,
|
||||||
self.geocorr_urban_rural_df,
|
self.geocorr_urban_rural_df,
|
||||||
self.persistent_poverty_df,
|
self.persistent_poverty_df,
|
||||||
|
self.housing_and_transportation_df,
|
||||||
]
|
]
|
||||||
census_tract_df = self._join_tract_dfs(census_tract_dfs)
|
census_tract_df = self._join_tract_dfs(census_tract_dfs)
|
||||||
|
|
||||||
|
|
|
@ -11,7 +11,7 @@ logger = get_module_logger(__name__)
|
||||||
class HousingTransportationETL(ExtractTransformLoad):
|
class HousingTransportationETL(ExtractTransformLoad):
|
||||||
def __init__(self):
|
def __init__(self):
|
||||||
self.HOUSING_FTP_URL = (
|
self.HOUSING_FTP_URL = (
|
||||||
"https://htaindex.cnt.org/download/download.php?focus=blkgrp&geoid="
|
"https://htaindex.cnt.org/download/download.php?focus=tract&geoid="
|
||||||
)
|
)
|
||||||
self.OUTPUT_PATH = (
|
self.OUTPUT_PATH = (
|
||||||
self.DATA_PATH / "dataset" / "housing_and_transportation_index"
|
self.DATA_PATH / "dataset" / "housing_and_transportation_index"
|
||||||
|
@ -33,7 +33,7 @@ class HousingTransportationETL(ExtractTransformLoad):
|
||||||
|
|
||||||
# New file name:
|
# New file name:
|
||||||
tmp_csv_file_path = (
|
tmp_csv_file_path = (
|
||||||
zip_file_dir / f"htaindex_data_blkgrps_{fips}.csv"
|
zip_file_dir / f"htaindex_data_tracts_{fips}.csv"
|
||||||
)
|
)
|
||||||
|
|
||||||
try:
|
try:
|
||||||
|
@ -50,10 +50,10 @@ class HousingTransportationETL(ExtractTransformLoad):
|
||||||
def transform(self) -> None:
|
def transform(self) -> None:
|
||||||
logger.info("Transforming Housing and Transportation Data")
|
logger.info("Transforming Housing and Transportation Data")
|
||||||
|
|
||||||
# Rename and reformat block group ID
|
# Rename and reformat tract ID
|
||||||
self.df.rename(columns={"blkgrp": self.GEOID_FIELD_NAME}, inplace=True)
|
self.df.rename(columns={"tract": self.GEOID_TRACT_FIELD_NAME}, inplace=True)
|
||||||
self.df[self.GEOID_FIELD_NAME] = self.df[
|
self.df[self.GEOID_TRACT_FIELD_NAME] = self.df[
|
||||||
self.GEOID_FIELD_NAME
|
self.GEOID_TRACT_FIELD_NAME
|
||||||
].str.replace('"', "")
|
].str.replace('"', "")
|
||||||
|
|
||||||
def load(self) -> None:
|
def load(self) -> None:
|
||||||
|
|
Loading…
Add table
Reference in a new issue