diff --git a/data/data-pipeline/data_pipeline/content/config/csv.yml b/data/data-pipeline/data_pipeline/content/config/csv.yml index 41fb7981..93c96a06 100644 --- a/data/data-pipeline/data_pipeline/content/config/csv.yml +++ b/data/data-pipeline/data_pipeline/content/config/csv.yml @@ -74,6 +74,9 @@ fields: - score_name: Is low income (imputed and adjusted)? label: Is low income? format: bool +- score_name: Income data has been estimated based on neighbor income + label: Income data has been estimated based on geographic neighbor income + format: bool - score_name: Greater than or equal to the 90th percentile for expected agriculture loss rate and is low income? label: Greater than or equal to the 90th percentile for expected agriculture loss rate and is low income? format: bool @@ -101,6 +104,30 @@ fields: - score_name: Expected population loss rate (Natural Hazards Risk Index) label: Expected population loss rate (Natural Hazards Risk Index) format: loss_rate_percentage +- score_name: Share of properties at risk of flood in 30 years (percentile) + label: Share of properties at risk of flood in 30 years (percentile) + format: percentage +- score_name: Share of properties at risk of flood in 30 years + label: Share of properties at risk of flood in 30 years + format: percentage +- score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years + label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years + format: bool +- score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income? + label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income? + format: bool +- score_name: Share of properties at risk of fire in 30 years (percentile) + label: Share of properties at risk of fire in 30 years (percentile) + format: percentage +- score_name: Share of properties at risk of fire in 30 years + label: Share of properties at risk of fire in 30 years + format: percentage +- score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years + label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years + format: bool +- score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income? + label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income? + format: bool - score_name: Greater than or equal to the 90th percentile for energy burden and is low income? label: Greater than or equal to the 90th percentile for energy burden and is low income? format: bool @@ -137,6 +164,12 @@ fields: - score_name: Traffic proximity and volume label: Traffic proximity and volume format: float +- score_name: Greater than or equal to the 90th percentile for DOT transit barriers and is low income? + label: Greater than or equal to the 90th percentile for DOT transit barriers and is low income? + format: bool +- score_name: DOT Travel Barriers Score (percentile) + label: DOT Travel Barriers Score (percentile) + format: percentage - score_name: Greater than or equal to the 90th percentile for housing burden and is low income? label: Greater than or equal to the 90th percentile for housing burden and is low income? format: bool @@ -161,6 +194,33 @@ fields: - score_name: Median value ($) of owner-occupied housing units label: Median value ($) of owner-occupied housing units format: float +- score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income? + label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income? + format: bool +- score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent + label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent + format: bool +- score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent + label: Share of the tract's land area that is covered by impervious surface or cropland as a percent + format: percentage +- score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile) + label: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile) + format: percentage +- score_name: Does the tract have at least 35 acres in it? + label: Does the tract have at least 35 acres in it? + format: bool +- score_name: Tract-level redlining score meets or exceeds 3.25 and is low income + label: Tract experienced historic underinvestment and remains low income + format: bool +- score_name: Tract-level redlining score meets or exceeds 3.25 + label: Tract experienced historic underinvestment + format: bool +- score_name: Share of homes with no kitchen or indoor plumbing (percent) (percentile) + label: Share of homes with no kitchen or indoor plumbing (percentile) + format: float +- score_name: Share of homes with no kitchen or indoor plumbing (percent) + label: Share of homes with no kitchen or indoor plumbing (percent) + format: float - score_name: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities and is low income? label: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities and is low income? format: bool @@ -188,21 +248,39 @@ fields: - score_name: Proximity to Risk Management Plan (RMP) facilities label: Proximity to Risk Management Plan (RMP) facilities format: float +- score_name: Is there at least one Formerly Used Defense Site (FUDS) in the tract? + label: Is there at least one Formerly Used Defense Site (FUDS) in the tract? + format: bool +- score_name: Is there at least one abandoned mine in this census tract? + label: Is there at least one abandoned mine in this census tract? + format: bool +- score_name: There is at least one abandoned mine in this census tract and the tract is low income. + label: There is at least one abandoned mine in this census tract and the tract is low income. + format: bool +- score_name: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income. + label: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income. + format: bool +- score_name: Is there at least one Formerly Used Defense Site (FUDS) in the tract, where missing data is treated as False? + label: Is there at least one Formerly Used Defense Site (FUDS) in the tract, where missing data is treated as False? + format: bool +- score_name: Is there at least one abandoned mine in this census tract, where missing data is treated as False? + label: Is there at least one abandoned mine in this census tract, where missing data is treated as False? + format: bool - score_name: Greater than or equal to the 90th percentile for wastewater discharge and is low income? label: Greater than or equal to the 90th percentile for wastewater discharge and is low income? format: bool -- score_name: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income? - label: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income? - format: bool - score_name: Wastewater discharge (percentile) label: Wastewater discharge (percentile) format: percentage -- score_name: Leaky underground storage tanks (percentile) - label: Leaky underground storage tanks (percentile) - format: percentage - score_name: Wastewater discharge label: Wastewater discharge format: float +- score_name: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income? + label: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income? + format: bool +- score_name: Leaky underground storage tanks (percentile) + label: Leaky underground storage tanks (percentile) + format: percentage - score_name: Leaky underground storage tanks label: Leaky underground storage tanks format: float @@ -296,12 +374,6 @@ fields: - score_name: Unemployment (percent) in 2009 (island areas) and 2010 (states and PR) label: Unemployment (percent) in 2009 (island areas) and 2010 (states and PR) format: percentage -- score_name: Greater than or equal to the 90th percentile for DOT transit barriers and is low income? - label: Greater than or equal to the 90th percentile for DOT transit barriers and is low income? - format: bool -- score_name: DOT Travel Barriers Score (percentile) - label: DOT Travel Barriers Score (percentile) - format: percentage - score_name: Percentage households below 100% of federal poverty line in 2009 (island areas) and 2010 (states and PR) label: Percentage households below 100% of federal poverty line in 2009 (island areas) and 2010 (states and PR) format: percentage @@ -314,72 +386,6 @@ fields: - score_name: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS education in 2009 (island areas)? label: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS education in 2009 (island areas)? format: bool -- score_name: Share of properties at risk of flood in 30 years - label: Share of properties at risk of flood in 30 years - format: percentage -- score_name: Share of properties at risk of fire in 30 years - label: Share of properties at risk of fire in 30 years - format: percentage -- score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income? - label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income? - format: bool -- score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income? - label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income? - format: bool -- score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years - label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years - format: bool -- score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years - label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years - format: bool -- score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income? - label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income? - format: bool -- score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent - label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent - format: bool -- score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent - label: Share of the tract's land area that is covered by impervious surface or cropland as a percent - format: percentage -- score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile) - label: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile) - format: percentage -- score_name: Share of properties at risk of flood in 30 years (percentile) - label: Share of properties at risk of flood in 30 years (percentile) - format: percentage -- score_name: Share of properties at risk of fire in 30 years (percentile) - label: Share of properties at risk of fire in 30 years (percentile) - format: percentage -- score_name: Does the tract have at least 35 acres in it? - label: Does the tract have at least 35 acres in it? - format: bool -- score_name: Is there at least one Formerly Used Defense Site (FUDS) in the tract? - label: Is there at least one Formerly Used Defense Site (FUDS) in the tract? - format: bool -- score_name: Is there at least one abandoned mine in this census tract? - label: Is there at least one abandoned mine in this census tract? - format: bool -- score_name: Is there at least one Formerly Used Defense Site (FUDS) in the tract, where missing data is treated as False? - label: Is there at least one Formerly Used Defense Site (FUDS) in the tract, where missing data is treated as False? - format: bool -- score_name: Is there at least one abandoned mine in this census tract, where missing data is treated as False? - label: Is there at least one abandoned mine in this census tract, where missing data is treated as False? - format: bool -- score_name: There is at least one abandoned mine in this census tract and the tract is low income. - label: There is at least one abandoned mine in this census tract and the tract is low income. - format: bool -- score_name: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income. - label: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income. - format: bool -- score_name: Tract-level redlining score meets or exceeds 3.25 and is low income - label: Tract experienced historic underinvestment and remains low income - format: bool -- score_name: Tract-level redlining score meets or exceeds 3.25 - label: Tract experienced historic underinvestment - format: bool -- score_name: Income data has been estimated based on neighbor income - label: Income data has been estimated based on geographic neighbor income - format: bool - score_name: Number of Tribal areas within Census tract label: Number of Tribal areas within Census tract format: int64 diff --git a/data/data-pipeline/data_pipeline/content/config/excel.yml b/data/data-pipeline/data_pipeline/content/config/excel.yml index 2b69cef3..34b89dee 100644 --- a/data/data-pipeline/data_pipeline/content/config/excel.yml +++ b/data/data-pipeline/data_pipeline/content/config/excel.yml @@ -78,6 +78,9 @@ sheets: - score_name: Is low income (imputed and adjusted)? label: Is low income? format: bool + - score_name: Income data has been estimated based on neighbor income + label: Income data has been estimated based on geographic neighbor income + format: bool - score_name: Greater than or equal to the 90th percentile for expected agriculture loss rate and is low income? label: Greater than or equal to the 90th percentile for expected agriculture loss rate and is low income? format: bool @@ -105,6 +108,30 @@ sheets: - score_name: Expected population loss rate (Natural Hazards Risk Index) label: Expected population loss rate (Natural Hazards Risk Index) format: loss_rate_percentage + - score_name: Share of properties at risk of flood in 30 years (percentile) + label: Share of properties at risk of flood in 30 years (percentile) + format: percentage + - score_name: Share of properties at risk of flood in 30 years + label: Share of properties at risk of flood in 30 years + format: percentage + - score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years + label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years + format: bool + - score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income? + label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income? + format: bool + - score_name: Share of properties at risk of fire in 30 years (percentile) + label: Share of properties at risk of fire in 30 years (percentile) + format: percentage + - score_name: Share of properties at risk of fire in 30 years + label: Share of properties at risk of fire in 30 years + format: percentage + - score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years + label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years + format: bool + - score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income? + label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income? + format: bool - score_name: Greater than or equal to the 90th percentile for energy burden and is low income? label: Greater than or equal to the 90th percentile for energy burden and is low income? format: bool @@ -141,6 +168,12 @@ sheets: - score_name: Traffic proximity and volume label: Traffic proximity and volume format: float + - score_name: Greater than or equal to the 90th percentile for DOT transit barriers and is low income? + label: Greater than or equal to the 90th percentile for DOT transit barriers and is low income? + format: bool + - score_name: DOT Travel Barriers Score (percentile) + label: DOT Travel Barriers Score (percentile) + format: percentage - score_name: Greater than or equal to the 90th percentile for housing burden and is low income? label: Greater than or equal to the 90th percentile for housing burden and is low income? format: bool @@ -165,6 +198,33 @@ sheets: - score_name: Median value ($) of owner-occupied housing units label: Median value ($) of owner-occupied housing units format: float + - score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income? + label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income? + format: bool + - score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent + label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent + format: bool + - score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent + label: Share of the tract's land area that is covered by impervious surface or cropland as a percent + format: percentage + - score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile) + label: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile) + format: percentage + - score_name: Does the tract have at least 35 acres in it? + label: Does the tract have at least 35 acres in it? + format: bool + - score_name: Tract-level redlining score meets or exceeds 3.25 and is low income + label: Tract experienced historic underinvestment and remains low income + format: bool + - score_name: Tract-level redlining score meets or exceeds 3.25 + label: Tract experienced historic underinvestment + format: bool + - score_name: Share of homes with no kitchen or indoor plumbing (percent) (percentile) + label: Share of homes with no kitchen or indoor plumbing (percentile) + format: float + - score_name: Share of homes with no kitchen or indoor plumbing (percent) + label: Share of homes with no kitchen or indoor plumbing (percent) + format: float - score_name: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities and is low income? label: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities and is low income? format: bool @@ -192,21 +252,39 @@ sheets: - score_name: Proximity to Risk Management Plan (RMP) facilities label: Proximity to Risk Management Plan (RMP) facilities format: float + - score_name: Is there at least one Formerly Used Defense Site (FUDS) in the tract? + label: Is there at least one Formerly Used Defense Site (FUDS) in the tract? + format: bool + - score_name: Is there at least one abandoned mine in this census tract? + label: Is there at least one abandoned mine in this census tract? + format: bool + - score_name: There is at least one abandoned mine in this census tract and the tract is low income. + label: There is at least one abandoned mine in this census tract and the tract is low income. + format: bool + - score_name: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income. + label: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income. + format: bool + - score_name: Is there at least one Formerly Used Defense Site (FUDS) in the tract, where missing data is treated as False? + label: Is there at least one Formerly Used Defense Site (FUDS) in the tract, where missing data is treated as False? + format: bool + - score_name: Is there at least one abandoned mine in this census tract, where missing data is treated as False? + label: Is there at least one abandoned mine in this census tract, where missing data is treated as False? + format: bool - score_name: Greater than or equal to the 90th percentile for wastewater discharge and is low income? label: Greater than or equal to the 90th percentile for wastewater discharge and is low income? format: bool - - score_name: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income? - label: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income? - format: bool - score_name: Wastewater discharge (percentile) label: Wastewater discharge (percentile) format: percentage - - score_name: Leaky underground storage tanks (percentile) - label: Leaky underground storage tanks (percentile) - format: percentage - score_name: Wastewater discharge label: Wastewater discharge format: float + - score_name: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income? + label: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income? + format: bool + - score_name: Leaky underground storage tanks (percentile) + label: Leaky underground storage tanks (percentile) + format: percentage - score_name: Leaky underground storage tanks label: Leaky underground storage tanks format: float @@ -300,12 +378,6 @@ sheets: - score_name: Unemployment (percent) in 2009 (island areas) and 2010 (states and PR) label: Unemployment (percent) in 2009 (island areas) and 2010 (states and PR) format: percentage - - score_name: Greater than or equal to the 90th percentile for DOT transit barriers and is low income? - label: Greater than or equal to the 90th percentile for DOT transit barriers and is low income? - format: bool - - score_name: DOT Travel Barriers Score (percentile) - label: DOT Travel Barriers Score (percentile) - format: percentage - score_name: Percentage households below 100% of federal poverty line in 2009 (island areas) and 2010 (states and PR) label: Percentage households below 100% of federal poverty line in 2009 (island areas) and 2010 (states and PR) format: percentage @@ -318,72 +390,6 @@ sheets: - score_name: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS education in 2009 (island areas)? label: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS education in 2009 (island areas)? format: bool - - score_name: Share of properties at risk of flood in 30 years - label: Share of properties at risk of flood in 30 years - format: percentage - - score_name: Share of properties at risk of fire in 30 years - label: Share of properties at risk of fire in 30 years - format: percentage - - score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income? - label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income? - format: bool - - score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income? - label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income? - format: bool - - score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years - label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years - format: bool - - score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years - label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years - format: bool - - score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income? - label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income? - format: bool - - score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent - label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent - format: bool - - score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent - label: Share of the tract's land area that is covered by impervious surface or cropland as a percent - format: percentage - - score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile) - label: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile) - format: percentage - - score_name: Share of properties at risk of flood in 30 years (percentile) - label: Share of properties at risk of flood in 30 years (percentile) - format: percentage - - score_name: Share of properties at risk of fire in 30 years (percentile) - label: Share of properties at risk of fire in 30 years (percentile) - format: percentage - - score_name: Does the tract have at least 35 acres in it? - label: Does the tract have at least 35 acres in it? - format: bool - - score_name: Is there at least one Formerly Used Defense Site (FUDS) in the tract? - label: Is there at least one Formerly Used Defense Site (FUDS) in the tract? - format: bool - - score_name: Is there at least one abandoned mine in this census tract? - label: Is there at least one abandoned mine in this census tract? - format: bool - - score_name: There is at least one abandoned mine in this census tract and the tract is low income. - label: There is at least one abandoned mine in this census tract and the tract is low income. - format: bool - - score_name: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income. - label: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income. - format: bool - - score_name: Is there at least one Formerly Used Defense Site (FUDS) in the tract, where missing data is treated as False? - label: Is there at least one Formerly Used Defense Site (FUDS) in the tract, where missing data is treated as False? - format: bool - - score_name: Is there at least one abandoned mine in this census tract, where missing data is treated as False? - label: Is there at least one abandoned mine in this census tract, where missing data is treated as False? - format: bool - - score_name: Tract-level redlining score meets or exceeds 3.25 and is low income - label: Tract experienced historic underinvestment and remains low income - format: bool - - score_name: Tract-level redlining score meets or exceeds 3.25 - label: Tract experienced historic underinvestment - format: bool - - score_name: Income data has been estimated based on neighbor income - label: Income data has been estimated based on geographic neighbor income - format: bool - score_name: Number of Tribal areas within Census tract label: Number of Tribal areas within Census tract format: int64 diff --git a/data/data-pipeline/data_pipeline/etl/score/tests/snapshots/downloadable_data_expected.pkl b/data/data-pipeline/data_pipeline/etl/score/tests/snapshots/downloadable_data_expected.pkl index 6547f46d..900f1143 100644 Binary files a/data/data-pipeline/data_pipeline/etl/score/tests/snapshots/downloadable_data_expected.pkl and b/data/data-pipeline/data_pipeline/etl/score/tests/snapshots/downloadable_data_expected.pkl differ