mirror of
https://github.com/DOI-DO/j40-cejst-2.git
synced 2025-07-28 14:31:16 -07:00
adding median income field and running black
This commit is contained in:
parent
6c986adfe4
commit
4ae7eff4c4
6 changed files with 33 additions and 10 deletions
|
@ -22,6 +22,8 @@ class CensusACSETL(ExtractTransformLoad):
|
|||
"C16002_010E",
|
||||
"C16002_013E",
|
||||
]
|
||||
self.MEDIAN_INCOME_FIELD = "B19013_001E"
|
||||
self.MEDIAN_INCOME_FIELD_NAME = "Median household income in the past 12 months"
|
||||
self.df: pd.DataFrame
|
||||
|
||||
def _fips_from_censusdata_censusgeo(self, censusgeo: censusdata.censusgeo) -> str:
|
||||
|
@ -45,6 +47,7 @@ class CensusACSETL(ExtractTransformLoad):
|
|||
# Employment fields
|
||||
"B23025_005E",
|
||||
"B23025_003E",
|
||||
self.MEDIAN_INCOME_FIELD,
|
||||
]
|
||||
+ self.LINGUISTIC_ISOLATION_FIELDS,
|
||||
)
|
||||
|
@ -59,6 +62,9 @@ class CensusACSETL(ExtractTransformLoad):
|
|||
def transform(self) -> None:
|
||||
logger.info("Starting Census ACS Transform")
|
||||
|
||||
# Copy median income into a column with a human-readable name
|
||||
self.df[self.MEDIAN_INCOME_FIELD_NAME] = self.df[self.MEDIAN_INCOME_FIELD]
|
||||
|
||||
# Calculate percent unemployment.
|
||||
# TODO: remove small-sample data that should be `None` instead of a high-variance fraction.
|
||||
self.df[self.UNEMPLOYED_FIELD_NAME] = self.df.B23025_005E / self.df.B23025_003E
|
||||
|
@ -91,6 +97,7 @@ class CensusACSETL(ExtractTransformLoad):
|
|||
self.GEOID_FIELD_NAME,
|
||||
self.UNEMPLOYED_FIELD_NAME,
|
||||
self.LINGUISTIC_ISOLATION_FIELD_NAME,
|
||||
self.MEDIAN_INCOME_FIELD_NAME,
|
||||
]
|
||||
|
||||
self.df[columns_to_include].to_csv(
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue