Updates backend constants to N (#1854)

This commit is contained in:
Emma Nechamkin 2022-08-23 16:19:00 -04:00 committed by GitHub
commit 6418335219
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
15 changed files with 1277 additions and 911 deletions

View file

@ -5,372 +5,372 @@ global_config:
float: 2
loss_rate_percentage: 4
fields:
- score_name: GEOID10_TRACT
label: Census tract ID
format: string
- score_name: County Name
label: County Name
format: string
- score_name: State/Territory
label: State/Territory
format: string
- score_name: Percent Black or African American
label: Percent Black or African American alone
format: float
- score_name: Percent American Indian / Alaska Native
label: Percent American Indian / Alaska Native
format: float
- score_name: Percent Asian
label: Percent Asian
format: float
- score_name: Percent Native Hawaiian or Pacific
label: Percent Native Hawaiian or Pacific
format: float
- score_name: Percent two or more races
label: Percent two or more races
format: float
- score_name: Percent White
label: Percent White
format: float
- score_name: Percent Hispanic or Latino
label: Percent Hispanic or Latino
format: float
- score_name: Percent other races
label: Percent other races
format: float
- score_name: Percent age under 10
label: Percent age under 10
format: float
- score_name: Percent age 10 to 64
label: Percent age 10 to 64
format: float
- score_name: Percent age over 64
label: Percent age over 64
format: float
- score_name: Total threshold criteria exceeded
label: Total threshold criteria exceeded
format: int64
- score_name: Total categories exceeded
label: Total categories exceeded
format: int64
- score_name: Definition N (communities)
label: Identified as disadvantaged without considering neighbors
format: bool
- score_name: Definition N (communities) (based on adjacency index and low income alone)
label: Identified as disadvantaged based on neighbors and relaxed low income threshold only
format: bool
- score_name: Definition M community, including adjacency index tracts
label: Identified as disadvantaged
format: bool
- score_name: Definition N (communities) (average of neighbors)
label: Share of neighbors that are identified as disadvantaged
format: percentage
- score_name: Total population
label: Total population
format: float
- score_name: Percent of individuals below 200% Federal Poverty Line, imputed and adjusted
label: Adjusted percent of individuals below 200% Federal Poverty Line
format: float
- score_name: Is low income and has a low percent of higher ed students?
label: Is low income and high percent of residents that are not higher ed students?
format: bool
- score_name: Greater than or equal to the 90th percentile for expected agriculture loss rate, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for expected agriculture loss rate, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Expected agricultural loss rate (Natural Hazards Risk Index) (percentile)
label: Expected agricultural loss rate (Natural Hazards Risk Index) (percentile)
format: percentage
- score_name: Expected agricultural loss rate (Natural Hazards Risk Index)
label: Expected agricultural loss rate (Natural Hazards Risk Index)
format: loss_rate_percentage
- score_name: Greater than or equal to the 90th percentile for expected building loss rate, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for expected building loss rate, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Expected building loss rate (Natural Hazards Risk Index) (percentile)
label: Expected building loss rate (Natural Hazards Risk Index) (percentile)
format: percentage
- score_name: Expected building loss rate (Natural Hazards Risk Index)
label: Expected building loss rate (Natural Hazards Risk Index)
format: loss_rate_percentage
- score_name: Greater than or equal to the 90th percentile for expected population loss rate, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for expected population loss rate, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Expected population loss rate (Natural Hazards Risk Index) (percentile)
label: Expected population loss rate (Natural Hazards Risk Index) (percentile)
format: percentage
- score_name: Expected population loss rate (Natural Hazards Risk Index)
label: Expected population loss rate (Natural Hazards Risk Index)
format: loss_rate_percentage
- score_name: Greater than or equal to the 90th percentile for energy burden, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for energy burden, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Energy burden (percentile)
label: Energy burden (percentile)
format: percentage
- score_name: Energy burden
label: Energy burden
format: percentage
- score_name: Greater than or equal to the 90th percentile for PM2.5 exposure, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for PM2.5 exposure, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: PM2.5 in the air (percentile)
label: PM2.5 in the air (percentile)
format: percentage
- score_name: PM2.5 in the air
label: PM2.5 in the air
format: float
- score_name: Greater than or equal to the 90th percentile for diesel particulate matter, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for diesel particulate matter, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Diesel particulate matter exposure (percentile)
label: Diesel particulate matter exposure (percentile)
format: percentage
- score_name: Diesel particulate matter exposure
label: Diesel particulate matter exposure
format: float
- score_name: Greater than or equal to the 90th percentile for traffic proximity, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for traffic proximity, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Traffic proximity and volume (percentile)
label: Traffic proximity and volume (percentile)
format: percentage
- score_name: Traffic proximity and volume
label: Traffic proximity and volume
format: float
- score_name: Greater than or equal to the 90th percentile for housing burden, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for housing burden, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Housing burden (percent) (percentile)
label: Housing burden (percent) (percentile)
format: percentage
- score_name: Housing burden (percent)
label: Housing burden (percent)
format: percentage
- score_name: Greater than or equal to the 90th percentile for lead paint, the median house value is less than 90th percentile, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for lead paint, the median house value is less than 90th percentile, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Percent pre-1960s housing (lead paint indicator) (percentile)
label: Percent pre-1960s housing (lead paint indicator) (percentile)
format: percentage
- score_name: Percent pre-1960s housing (lead paint indicator)
label: Percent pre-1960s housing (lead paint indicator)
format: percentage
- score_name: Median value ($) of owner-occupied housing units (percentile)
label: Median value ($) of owner-occupied housing units (percentile)
format: percentage
- score_name: Median value ($) of owner-occupied housing units
label: Median value ($) of owner-occupied housing units
format: float
- score_name: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Proximity to hazardous waste sites (percentile)
label: Proximity to hazardous waste sites (percentile)
format: percentage
- score_name: Proximity to hazardous waste sites
label: Proximity to hazardous waste sites
format: float
- score_name: Greater than or equal to the 90th percentile for proximity to superfund sites, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for proximity to superfund sites, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Proximity to NPL sites (percentile)
label: Proximity to NPL (Superfund) sites (percentile)
format: percentage
- score_name: Proximity to NPL sites
label: Proximity to NPL (Superfund) sites
format: float
- score_name: Greater than or equal to the 90th percentile for proximity to RMP sites, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for proximity to RMP sites, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Proximity to Risk Management Plan (RMP) facilities (percentile)
label: Proximity to Risk Management Plan (RMP) facilities (percentile)
format: percentage
- score_name: Proximity to Risk Management Plan (RMP) facilities
label: Proximity to Risk Management Plan (RMP) facilities
format: float
- score_name: Greater than or equal to the 90th percentile for wastewater discharge, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for wastewater discharge, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Wastewater discharge (percentile)
label: Wastewater discharge (percentile)
format: percentage
- score_name: Wastewater discharge
label: Wastewater discharge
format: float
- score_name: Greater than or equal to the 90th percentile for asthma, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for asthma, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Current asthma among adults aged greater than or equal to 18 years (percentile)
label: Current asthma among adults aged greater than or equal to 18 years (percentile)
format: percentage
- score_name: Current asthma among adults aged greater than or equal to 18 years
label: Current asthma among adults aged greater than or equal to 18 years
format: percentage
- score_name: Greater than or equal to the 90th percentile for diabetes, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for diabetes, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Diagnosed diabetes among adults aged greater than or equal to 18 years (percentile)
label: Diagnosed diabetes among adults aged greater than or equal to 18 years (percentile)
format: percentage
- score_name: Diagnosed diabetes among adults aged greater than or equal to 18 years
label: Diagnosed diabetes among adults aged greater than or equal to 18 years
format: percentage
- score_name: Greater than or equal to the 90th percentile for heart disease, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for heart disease, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Coronary heart disease among adults aged greater than or equal to 18 years (percentile)
label: Coronary heart disease among adults aged greater than or equal to 18 years (percentile)
format: percentage
- score_name: Coronary heart disease among adults aged greater than or equal to 18 years
label: Coronary heart disease among adults aged greater than or equal to 18 years
format: percentage
- score_name: Greater than or equal to the 90th percentile for low life expectancy, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for low life expectancy, is low income, and high percent of residents that are not higher ed students?
format: bool
- score_name: Low life expectancy (percentile)
label: Low life expectancy (percentile)
format: percentage
- score_name: Life expectancy (years)
label: Life expectancy (years)
format: float
- score_name: Greater than or equal to the 90th percentile for low median household income as a percent of area median income, has low HS attainment, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for low median household income as a percent of area median income, has low HS attainment, and high percent of residents that are not higher ed students?
format: bool
- score_name: Low median household income as a percent of area median income (percentile)
label: Low median household income as a percent of area median income (percentile)
format: percentage
- score_name: Median household income as a percent of area median income
label: Median household income as a percent of area median income
format: percentage
- score_name: Greater than or equal to the 90th percentile for households in linguistic isolation, has low HS attainment, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for households in linguistic isolation, has low HS attainment, and high percent of residents that are not higher ed students?
format: bool
- score_name: Linguistic isolation (percent) (percentile)
label: Linguistic isolation (percent) (percentile)
format: percentage
- score_name: Linguistic isolation (percent)
label: Linguistic isolation (percent)
format: percentage
- score_name: Greater than or equal to the 90th percentile for unemployment, has low HS attainment, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for unemployment, has low HS attainment, and high percent of residents that are not higher ed students?
format: bool
- score_name: Unemployment (percent) (percentile)
label: Unemployment (percent) (percentile)
format: percentage
- score_name: Unemployment (percent)
label: Unemployment (percent)
format: percentage
- score_name: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level, has low HS attainment, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level, has low HS attainment, and high percent of residents that are not higher ed students?
format: bool
- score_name: Percent of individuals below 200% Federal Poverty Line (percentile)
label: Percent of individuals below 200% Federal Poverty Line (percentile)
format: percentage
- score_name: Percent of individuals below 200% Federal Poverty Line
label: Percent of individuals below 200% Federal Poverty Line
format: percentage
- score_name: Percent of individuals < 100% Federal Poverty Line (percentile)
label: Percent of individuals < 100% Federal Poverty Line (percentile)
format: percentage
- score_name: Percent of individuals < 100% Federal Poverty Line
label: Percent of individuals < 100% Federal Poverty Line
format: percentage
- score_name: Percent individuals age 25 or over with less than high school degree (percentile)
label: Percent individuals age 25 or over with less than high school degree (percentile)
format: percentage
- score_name: Percent individuals age 25 or over with less than high school degree
label: Percent individuals age 25 or over with less than high school degree
format: percentage
- score_name: Unemployment (percent) in 2009 (island areas) and 2010 (states and PR)
label: Unemployment (percent) in 2009 (island areas) and 2010 (states and PR)
format: percentage
- score_name: Percentage households below 100% of federal poverty line in 2009 (island areas) and 2010 (states and PR)
label: Percentage households below 100% of federal poverty line in 2009 (island areas) and 2010 (states and PR)
format: percentage
- score_name: Greater than or equal to the 90th percentile for unemployment and has low HS education in 2009 (island areas)?
label: Greater than or equal to the 90th percentile for unemployment and has low HS education in 2009 (island areas)?
format: bool
- score_name: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level and has low HS education in 2009 (island areas)?
label: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level and has low HS education in 2009 (island areas)?
format: bool
- score_name: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS education in 2009 (island areas)?
label: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS education in 2009 (island areas)?
format: bool
- score_name: Percent of population not currently enrolled in college or graduate school
label: Percent of residents who are not currently enrolled in higher ed
format: percentage
- score_name: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income?
label: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income?
format: bool
- score_name: Greater than or equal to the 90th percentile for DOT transit barriers and is low income?
label: Greater than or equal to the 90th percentile for DOT transit barriers and is low income?
format: bool
- score_name: DOT Travel Barriers Score (percentile)
label: DOT Travel Barriers Score (percentile)
format: percentage
- score_name: Leaky underground storage tanks (percentile)
label: Leaky underground storage tanks (percentile)
format: percentage
- score_name: Leaky underground storage tanks
label: Leaky underground storage tanks
format: float
- score_name: Share of properties at risk of flood in 30 years
label: Share of properties at risk of flood in 30 years
format: float
- score_name: Share of properties at risk of fire in 30 years
label: Share of properties at risk of fire in 30 years
format: float
- score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income?
label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income?
format: bool
- score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income?
label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income?
format: bool
- score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years
label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years
format: bool
- score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years
label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years
format: bool
- score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income?
label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income?
format: bool
- score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent
label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent
format: bool
- score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent
label: Share of the tract's land area that is covered by impervious surface or cropland as a percent
format: percentage
- score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile)
label: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile)
format: percentage
- score_name: Share of properties at risk of flood in 30 years (percentile)
label: Share of properties at risk of flood in 30 years (percentile)
format: percentage
- score_name: Share of properties at risk of fire in 30 years (percentile)
label: Share of properties at risk of fire in 30 years (percentile)
format: percentage
- score_name: Does the tract have at least 35 acres in it?
label: Does the tract have at least 35 acres in it?
format: bool
- score_name: Is there at least one Formerly Used Defense Site (FUDS) in the tract?
label: Is there at least one Formerly Used Defense Site (FUDS) in the tract?
format: bool
- score_name: Is there at least one abandoned mine in this census tract?
label: Is there at least one abandoned mine in this census tract?
format: bool
- score_name: There is at least one abandoned mine in this census tract and the tract is low income.
label: There is at least one abandoned mine in this census tract and the tract is low income.
format: bool
- score_name: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income.
label: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income.
format: bool
- score_name: Tract-level redlining score meets or exceeds 3.25 and is low income
label: Tract experienced historic underinvestment and remains low income
format: bool
- score_name: Tract-level redlining score meets or exceeds 3.25
label: Tract experienced historic underinvestment
format: bool
- score_name: Income data has been estimated based on neighbor income
label: Income data has been estimated based on geographic neighbor income
format: bool
- score_name: GEOID10_TRACT
label: Census tract ID
format: string
- score_name: County Name
label: County Name
format: string
- score_name: State/Territory
label: State/Territory
format: string
- score_name: Percent Black or African American
label: Percent Black or African American alone
format: float
- score_name: Percent American Indian / Alaska Native
label: Percent American Indian / Alaska Native
format: float
- score_name: Percent Asian
label: Percent Asian
format: float
- score_name: Percent Native Hawaiian or Pacific
label: Percent Native Hawaiian or Pacific
format: float
- score_name: Percent two or more races
label: Percent two or more races
format: float
- score_name: Percent White
label: Percent White
format: float
- score_name: Percent Hispanic or Latino
label: Percent Hispanic or Latino
format: float
- score_name: Percent other races
label: Percent other races
format: float
- score_name: Percent age under 10
label: Percent age under 10
format: float
- score_name: Percent age 10 to 64
label: Percent age 10 to 64
format: float
- score_name: Percent age over 64
label: Percent age over 64
format: float
- score_name: Total threshold criteria exceeded
label: Total threshold criteria exceeded
format: int64
- score_name: Total categories exceeded
label: Total categories exceeded
format: int64
- score_name: Definition N (communities)
label: Identified as disadvantaged without considering neighbors
format: bool
- score_name: Definition N (communities) (based on adjacency index and low income alone)
label: Identified as disadvantaged based on neighbors and relaxed low income threshold only
format: bool
- score_name: Definition N community, including adjacency index tracts
label: Identified as disadvantaged
format: bool
- score_name: Definition N (communities) (average of neighbors)
label: Share of neighbors that are identified as disadvantaged
format: percentage
- score_name: Total population
label: Total population
format: float
- score_name: Percent of individuals below 200% Federal Poverty Line, imputed and adjusted
label: Adjusted percent of individuals below 200% Federal Poverty Line
format: float
- score_name: Is low income (imputed and adjusted)?
label: Is low income?
format: bool
- score_name: Greater than or equal to the 90th percentile for expected agriculture loss rate and is low income?
label: Greater than or equal to the 90th percentile for expected agriculture loss rate and is low income?
format: bool
- score_name: Expected agricultural loss rate (Natural Hazards Risk Index) (percentile)
label: Expected agricultural loss rate (Natural Hazards Risk Index) (percentile)
format: percentage
- score_name: Expected agricultural loss rate (Natural Hazards Risk Index)
label: Expected agricultural loss rate (Natural Hazards Risk Index)
format: loss_rate_percentage
- score_name: Greater than or equal to the 90th percentile for expected building loss rate and is low income?
label: Greater than or equal to the 90th percentile for expected building loss rate and is low income?
format: bool
- score_name: Expected building loss rate (Natural Hazards Risk Index) (percentile)
label: Expected building loss rate (Natural Hazards Risk Index) (percentile)
format: percentage
- score_name: Expected building loss rate (Natural Hazards Risk Index)
label: Expected building loss rate (Natural Hazards Risk Index)
format: loss_rate_percentage
- score_name: Greater than or equal to the 90th percentile for expected population loss rate and is low income?
label: Greater than or equal to the 90th percentile for expected population loss rate and is low income?
format: bool
- score_name: Expected population loss rate (Natural Hazards Risk Index) (percentile)
label: Expected population loss rate (Natural Hazards Risk Index) (percentile)
format: percentage
- score_name: Expected population loss rate (Natural Hazards Risk Index)
label: Expected population loss rate (Natural Hazards Risk Index)
format: loss_rate_percentage
- score_name: Greater than or equal to the 90th percentile for energy burden and is low income?
label: Greater than or equal to the 90th percentile for energy burden and is low income?
format: bool
- score_name: Energy burden (percentile)
label: Energy burden (percentile)
format: percentage
- score_name: Energy burden
label: Energy burden
format: percentage
- score_name: Greater than or equal to the 90th percentile for PM2.5 exposure and is low income?
label: Greater than or equal to the 90th percentile for PM2.5 exposure and is low income?
format: bool
- score_name: PM2.5 in the air (percentile)
label: PM2.5 in the air (percentile)
format: percentage
- score_name: PM2.5 in the air
label: PM2.5 in the air
format: float
- score_name: Greater than or equal to the 90th percentile for diesel particulate matter and is low income?
label: Greater than or equal to the 90th percentile for diesel particulate matter and is low income?
format: bool
- score_name: Diesel particulate matter exposure (percentile)
label: Diesel particulate matter exposure (percentile)
format: percentage
- score_name: Diesel particulate matter exposure
label: Diesel particulate matter exposure
format: float
- score_name: Greater than or equal to the 90th percentile for traffic proximity and is low income?
label: Greater than or equal to the 90th percentile for traffic proximity and is low income?
format: bool
- score_name: Traffic proximity and volume (percentile)
label: Traffic proximity and volume (percentile)
format: percentage
- score_name: Traffic proximity and volume
label: Traffic proximity and volume
format: float
- score_name: Greater than or equal to the 90th percentile for housing burden and is low income?
label: Greater than or equal to the 90th percentile for housing burden and is low income?
format: bool
- score_name: Housing burden (percent) (percentile)
label: Housing burden (percent) (percentile)
format: percentage
- score_name: Housing burden (percent)
label: Housing burden (percent)
format: percentage
- score_name: Greater than or equal to the 90th percentile for lead paint and the median house value is less than 90th percentile and is low income?
label: Greater than or equal to the 90th percentile for lead paint, the median house value is less than 90th percentile and is low income?
format: bool
- score_name: Percent pre-1960s housing (lead paint indicator) (percentile)
label: Percent pre-1960s housing (lead paint indicator) (percentile)
format: percentage
- score_name: Percent pre-1960s housing (lead paint indicator)
label: Percent pre-1960s housing (lead paint indicator)
format: percentage
- score_name: Median value ($) of owner-occupied housing units (percentile)
label: Median value ($) of owner-occupied housing units (percentile)
format: percentage
- score_name: Median value ($) of owner-occupied housing units
label: Median value ($) of owner-occupied housing units
format: float
- score_name: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities and is low income?
label: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities and is low income?
format: bool
- score_name: Proximity to hazardous waste sites (percentile)
label: Proximity to hazardous waste sites (percentile)
format: percentage
- score_name: Proximity to hazardous waste sites
label: Proximity to hazardous waste sites
format: float
- score_name: Greater than or equal to the 90th percentile for proximity to superfund sites and is low income?
label: Greater than or equal to the 90th percentile for proximity to superfund sites and is low income?
format: bool
- score_name: Proximity to NPL sites (percentile)
label: Proximity to NPL (Superfund) sites (percentile)
format: percentage
- score_name: Proximity to NPL sites
label: Proximity to NPL (Superfund) sites
format: float
- score_name: Greater than or equal to the 90th percentile for proximity to RMP sites and is low income?
label: Greater than or equal to the 90th percentile for proximity to RMP sites and is low income?
format: bool
- score_name: Proximity to Risk Management Plan (RMP) facilities (percentile)
label: Proximity to Risk Management Plan (RMP) facilities (percentile)
format: percentage
- score_name: Proximity to Risk Management Plan (RMP) facilities
label: Proximity to Risk Management Plan (RMP) facilities
format: float
- score_name: Greater than or equal to the 90th percentile for wastewater discharge and is low income?
label: Greater than or equal to the 90th percentile for wastewater discharge and is low income?
format: bool
- score_name: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income?
label: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income?
format: bool
- score_name: Wastewater discharge (percentile)
label: Wastewater discharge (percentile)
format: percentage
- score_name: Leaky underground storage tanks (percentile)
label: Leaky underground storage tanks (percentile)
format: percentage
- score_name: Wastewater discharge
label: Wastewater discharge
format: float
- score_name: Leaky underground storage tanks
label: Leaky underground storage tanks
format: float
- score_name: Greater than or equal to the 90th percentile for asthma and is low income?
label: Greater than or equal to the 90th percentile for asthma and is low income?
format: bool
- score_name: Current asthma among adults aged greater than or equal to 18 years (percentile)
label: Current asthma among adults aged greater than or equal to 18 years (percentile)
format: percentage
- score_name: Current asthma among adults aged greater than or equal to 18 years
label: Current asthma among adults aged greater than or equal to 18 years
format: percentage
- score_name: Greater than or equal to the 90th percentile for diabetes and is low income?
label: Greater than or equal to the 90th percentile for diabetes and is low income?
format: bool
- score_name: Diagnosed diabetes among adults aged greater than or equal to 18 years (percentile)
label: Diagnosed diabetes among adults aged greater than or equal to 18 years (percentile)
format: percentage
- score_name: Diagnosed diabetes among adults aged greater than or equal to 18 years
label: Diagnosed diabetes among adults aged greater than or equal to 18 years
format: percentage
- score_name: Greater than or equal to the 90th percentile for heart disease and is low income?
label: Greater than or equal to the 90th percentile for heart disease and is low income?
format: bool
- score_name: Coronary heart disease among adults aged greater than or equal to 18 years (percentile)
label: Coronary heart disease among adults aged greater than or equal to 18 years (percentile)
format: percentage
- score_name: Coronary heart disease among adults aged greater than or equal to 18 years
label: Coronary heart disease among adults aged greater than or equal to 18 years
format: percentage
- score_name: Greater than or equal to the 90th percentile for low life expectancy and is low income?
label: Greater than or equal to the 90th percentile for low life expectancy and is low income?
format: bool
- score_name: Low life expectancy (percentile)
label: Low life expectancy (percentile)
format: percentage
- score_name: Life expectancy (years)
label: Life expectancy (years)
format: float
- score_name: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS attainment?
label: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS attainment?
format: bool
- score_name: Low median household income as a percent of area median income (percentile)
label: Low median household income as a percent of area median income (percentile)
format: percentage
- score_name: Median household income as a percent of area median income
label: Median household income as a percent of area median income
format: percentage
- score_name: Greater than or equal to the 90th percentile for households in linguistic isolation and has low HS attainment?
label: Greater than or equal to the 90th percentile for households in linguistic isolation and has low HS attainment?
format: bool
- score_name: Linguistic isolation (percent) (percentile)
label: Linguistic isolation (percent) (percentile)
format: percentage
- score_name: Linguistic isolation (percent)
label: Linguistic isolation (percent)
format: percentage
- score_name: Greater than or equal to the 90th percentile for unemployment and has low HS attainment?
label: Greater than or equal to the 90th percentile for unemployment and has low HS attainment?
format: bool
- score_name: Unemployment (percent) (percentile)
label: Unemployment (percent) (percentile)
format: percentage
- score_name: Unemployment (percent)
label: Unemployment (percent)
format: percentage
- score_name: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level and has low HS attainment?
label: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level and has low HS attainment?
format: bool
- score_name: Percent of individuals below 200% Federal Poverty Line (percentile)
label: Percent of individuals below 200% Federal Poverty Line (percentile)
format: percentage
- score_name: Percent of individuals below 200% Federal Poverty Line
label: Percent of individuals below 200% Federal Poverty Line
format: percentage
- score_name: Percent of individuals < 100% Federal Poverty Line (percentile)
label: Percent of individuals < 100% Federal Poverty Line (percentile)
format: percentage
- score_name: Percent of individuals < 100% Federal Poverty Line
label: Percent of individuals < 100% Federal Poverty Line
format: percentage
- score_name: Percent individuals age 25 or over with less than high school degree (percentile)
label: Percent individuals age 25 or over with less than high school degree (percentile)
format: percentage
- score_name: Percent individuals age 25 or over with less than high school degree
label: Percent individuals age 25 or over with less than high school degree
format: percentage
- score_name: Percent of population not currently enrolled in college or graduate school
label: Percent of residents who are not currently enrolled in higher ed
format: percentage
- score_name: Unemployment (percent) in 2009 (island areas) and 2010 (states and PR)
label: Unemployment (percent) in 2009 (island areas) and 2010 (states and PR)
format: percentage
- score_name: Greater than or equal to the 90th percentile for DOT transit barriers and is low income?
label: Greater than or equal to the 90th percentile for DOT transit barriers and is low income?
format: bool
- score_name: DOT Travel Barriers Score (percentile)
label: DOT Travel Barriers Score (percentile)
format: percentage
- score_name: Percentage households below 100% of federal poverty line in 2009 (island areas) and 2010 (states and PR)
label: Percentage households below 100% of federal poverty line in 2009 (island areas) and 2010 (states and PR)
format: percentage
- score_name: Greater than or equal to the 90th percentile for unemployment and has low HS education in 2009 (island areas)?
label: Greater than or equal to the 90th percentile for unemployment and has low HS education in 2009 (island areas)?
format: bool
- score_name: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level and has low HS education in 2009 (island areas)?
label: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level and has low HS education in 2009 (island areas)?
format: bool
- score_name: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS education in 2009 (island areas)?
label: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS education in 2009 (island areas)?
format: bool
- score_name: Share of properties at risk of flood in 30 years
label: Share of properties at risk of flood in 30 years
format: percentage
- score_name: Share of properties at risk of fire in 30 years
label: Share of properties at risk of fire in 30 years
format: percentage
- score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income?
label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years and is low income?
format: bool
- score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income?
label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years and is low income?
format: bool
- score_name: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years
label: Greater than or equal to the 90th percentile for share of properties at risk of flood in 30 years
format: bool
- score_name: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years
label: Greater than or equal to the 90th percentile for share of properties at risk of fire in 30 years
format: bool
- score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income?
label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent and is low income?
format: bool
- score_name: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent
label: Greater than or equal to the 90th percentile for share of the tract's land area that is covered by impervious surface or cropland as a percent
format: bool
- score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent
label: Share of the tract's land area that is covered by impervious surface or cropland as a percent
format: percentage
- score_name: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile)
label: Share of the tract's land area that is covered by impervious surface or cropland as a percent (percentile)
format: percentage
- score_name: Share of properties at risk of flood in 30 years (percentile)
label: Share of properties at risk of flood in 30 years (percentile)
format: percentage
- score_name: Share of properties at risk of fire in 30 years (percentile)
label: Share of properties at risk of fire in 30 years (percentile)
format: percentage
- score_name: Does the tract have at least 35 acres in it?
label: Does the tract have at least 35 acres in it?
format: bool
- score_name: Is there at least one Formerly Used Defense Site (FUDS) in the tract?
label: Is there at least one Formerly Used Defense Site (FUDS) in the tract?
format: bool
- score_name: Is there at least one abandoned mine in this census tract?
label: Is there at least one abandoned mine in this census tract?
format: bool
- score_name: There is at least one abandoned mine in this census tract and the tract is low income.
label: There is at least one abandoned mine in this census tract and the tract is low income.
format: bool
- score_name: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income.
label: There is at least one Formerly Used Defense Site (FUDS) in the tract and the tract is low income.
format: bool
- score_name: Tract-level redlining score meets or exceeds 3.25 and is low income
label: Tract experienced historic underinvestment and remains low income
format: bool
- score_name: Tract-level redlining score meets or exceeds 3.25
label: Tract experienced historic underinvestment
format: bool
- score_name: Income data has been estimated based on neighbor income
label: Income data has been estimated based on geographic neighbor income
format: bool

View file

@ -63,7 +63,7 @@ sheets:
- score_name: Definition N (communities) (based on adjacency index and low income alone)
label: Identified as disadvantaged based on neighbors and relaxed low income threshold only
format: bool
- score_name: Definition M community, including adjacency index tracts
- score_name: Definition N community, including adjacency index tracts
label: Identified as disadvantaged
format: bool
- score_name: Definition N (communities) (average of neighbors)
@ -75,11 +75,11 @@ sheets:
- score_name: Percent of individuals below 200% Federal Poverty Line, imputed and adjusted
label: Adjusted percent of individuals below 200% Federal Poverty Line
format: float
- score_name: Is low income and has a low percent of higher ed students?
label: Is low income and high percent of residents that are not higher ed students?
- score_name: Is low income (imputed and adjusted)?
label: Is low income?
format: bool
- score_name: Greater than or equal to the 90th percentile for expected agriculture loss rate, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for expected agriculture loss rate, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for expected agriculture loss rate and is low income?
label: Greater than or equal to the 90th percentile for expected agriculture loss rate and is low income?
format: bool
- score_name: Expected agricultural loss rate (Natural Hazards Risk Index) (percentile)
label: Expected agricultural loss rate (Natural Hazards Risk Index) (percentile)
@ -87,8 +87,8 @@ sheets:
- score_name: Expected agricultural loss rate (Natural Hazards Risk Index)
label: Expected agricultural loss rate (Natural Hazards Risk Index)
format: loss_rate_percentage
- score_name: Greater than or equal to the 90th percentile for expected building loss rate, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for expected building loss rate, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for expected building loss rate and is low income?
label: Greater than or equal to the 90th percentile for expected building loss rate and is low income?
format: bool
- score_name: Expected building loss rate (Natural Hazards Risk Index) (percentile)
label: Expected building loss rate (Natural Hazards Risk Index) (percentile)
@ -96,8 +96,8 @@ sheets:
- score_name: Expected building loss rate (Natural Hazards Risk Index)
label: Expected building loss rate (Natural Hazards Risk Index)
format: loss_rate_percentage
- score_name: Greater than or equal to the 90th percentile for expected population loss rate, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for expected population loss rate, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for expected population loss rate and is low income?
label: Greater than or equal to the 90th percentile for expected population loss rate and is low income?
format: bool
- score_name: Expected population loss rate (Natural Hazards Risk Index) (percentile)
label: Expected population loss rate (Natural Hazards Risk Index) (percentile)
@ -105,8 +105,8 @@ sheets:
- score_name: Expected population loss rate (Natural Hazards Risk Index)
label: Expected population loss rate (Natural Hazards Risk Index)
format: loss_rate_percentage
- score_name: Greater than or equal to the 90th percentile for energy burden, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for energy burden, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for energy burden and is low income?
label: Greater than or equal to the 90th percentile for energy burden and is low income?
format: bool
- score_name: Energy burden (percentile)
label: Energy burden (percentile)
@ -114,8 +114,8 @@ sheets:
- score_name: Energy burden
label: Energy burden
format: percentage
- score_name: Greater than or equal to the 90th percentile for PM2.5 exposure, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for PM2.5 exposure, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for PM2.5 exposure and is low income?
label: Greater than or equal to the 90th percentile for PM2.5 exposure and is low income?
format: bool
- score_name: PM2.5 in the air (percentile)
label: PM2.5 in the air (percentile)
@ -123,8 +123,8 @@ sheets:
- score_name: PM2.5 in the air
label: PM2.5 in the air
format: float
- score_name: Greater than or equal to the 90th percentile for diesel particulate matter, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for diesel particulate matter, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for diesel particulate matter and is low income?
label: Greater than or equal to the 90th percentile for diesel particulate matter and is low income?
format: bool
- score_name: Diesel particulate matter exposure (percentile)
label: Diesel particulate matter exposure (percentile)
@ -132,8 +132,8 @@ sheets:
- score_name: Diesel particulate matter exposure
label: Diesel particulate matter exposure
format: float
- score_name: Greater than or equal to the 90th percentile for traffic proximity, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for traffic proximity, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for traffic proximity and is low income?
label: Greater than or equal to the 90th percentile for traffic proximity and is low income?
format: bool
- score_name: Traffic proximity and volume (percentile)
label: Traffic proximity and volume (percentile)
@ -141,8 +141,8 @@ sheets:
- score_name: Traffic proximity and volume
label: Traffic proximity and volume
format: float
- score_name: Greater than or equal to the 90th percentile for housing burden, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for housing burden, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for housing burden and is low income?
label: Greater than or equal to the 90th percentile for housing burden and is low income?
format: bool
- score_name: Housing burden (percent) (percentile)
label: Housing burden (percent) (percentile)
@ -150,8 +150,8 @@ sheets:
- score_name: Housing burden (percent)
label: Housing burden (percent)
format: percentage
- score_name: Greater than or equal to the 90th percentile for lead paint, the median house value is less than 90th percentile, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for lead paint, the median house value is less than 90th percentile, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for lead paint and the median house value is less than 90th percentile and is low income?
label: Greater than or equal to the 90th percentile for lead paint, the median house value is less than 90th percentile and is low income?
format: bool
- score_name: Percent pre-1960s housing (lead paint indicator) (percentile)
label: Percent pre-1960s housing (lead paint indicator) (percentile)
@ -165,8 +165,8 @@ sheets:
- score_name: Median value ($) of owner-occupied housing units
label: Median value ($) of owner-occupied housing units
format: float
- score_name: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities and is low income?
label: Greater than or equal to the 90th percentile for proximity to hazardous waste facilities and is low income?
format: bool
- score_name: Proximity to hazardous waste sites (percentile)
label: Proximity to hazardous waste sites (percentile)
@ -174,8 +174,8 @@ sheets:
- score_name: Proximity to hazardous waste sites
label: Proximity to hazardous waste sites
format: float
- score_name: Greater than or equal to the 90th percentile for proximity to superfund sites, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for proximity to superfund sites, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for proximity to superfund sites and is low income?
label: Greater than or equal to the 90th percentile for proximity to superfund sites and is low income?
format: bool
- score_name: Proximity to NPL sites (percentile)
label: Proximity to NPL (Superfund) sites (percentile)
@ -183,8 +183,8 @@ sheets:
- score_name: Proximity to NPL sites
label: Proximity to NPL (Superfund) sites
format: float
- score_name: Greater than or equal to the 90th percentile for proximity to RMP sites, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for proximity to RMP sites, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for proximity to RMP sites and is low income?
label: Greater than or equal to the 90th percentile for proximity to RMP sites and is low income?
format: bool
- score_name: Proximity to Risk Management Plan (RMP) facilities (percentile)
label: Proximity to Risk Management Plan (RMP) facilities (percentile)
@ -192,8 +192,8 @@ sheets:
- score_name: Proximity to Risk Management Plan (RMP) facilities
label: Proximity to Risk Management Plan (RMP) facilities
format: float
- score_name: Greater than or equal to the 90th percentile for wastewater discharge, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for wastewater discharge, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for wastewater discharge and is low income?
label: Greater than or equal to the 90th percentile for wastewater discharge and is low income?
format: bool
- score_name: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income?
label: Greater than or equal to the 90th percentile for leaky underground storage tanks and is low income?
@ -210,8 +210,8 @@ sheets:
- score_name: Leaky underground storage tanks
label: Leaky underground storage tanks
format: float
- score_name: Greater than or equal to the 90th percentile for asthma, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for asthma, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for asthma and is low income?
label: Greater than or equal to the 90th percentile for asthma and is low income?
format: bool
- score_name: Current asthma among adults aged greater than or equal to 18 years (percentile)
label: Current asthma among adults aged greater than or equal to 18 years (percentile)
@ -219,8 +219,8 @@ sheets:
- score_name: Current asthma among adults aged greater than or equal to 18 years
label: Current asthma among adults aged greater than or equal to 18 years
format: percentage
- score_name: Greater than or equal to the 90th percentile for diabetes, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for diabetes, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for diabetes and is low income?
label: Greater than or equal to the 90th percentile for diabetes and is low income?
format: bool
- score_name: Diagnosed diabetes among adults aged greater than or equal to 18 years (percentile)
label: Diagnosed diabetes among adults aged greater than or equal to 18 years (percentile)
@ -228,8 +228,8 @@ sheets:
- score_name: Diagnosed diabetes among adults aged greater than or equal to 18 years
label: Diagnosed diabetes among adults aged greater than or equal to 18 years
format: percentage
- score_name: Greater than or equal to the 90th percentile for heart disease, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for heart disease, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for heart disease and is low income?
label: Greater than or equal to the 90th percentile for heart disease and is low income?
format: bool
- score_name: Coronary heart disease among adults aged greater than or equal to 18 years (percentile)
label: Coronary heart disease among adults aged greater than or equal to 18 years (percentile)
@ -237,8 +237,8 @@ sheets:
- score_name: Coronary heart disease among adults aged greater than or equal to 18 years
label: Coronary heart disease among adults aged greater than or equal to 18 years
format: percentage
- score_name: Greater than or equal to the 90th percentile for low life expectancy, is low income, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for low life expectancy, is low income, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for low life expectancy and is low income?
label: Greater than or equal to the 90th percentile for low life expectancy and is low income?
format: bool
- score_name: Low life expectancy (percentile)
label: Low life expectancy (percentile)
@ -246,8 +246,8 @@ sheets:
- score_name: Life expectancy (years)
label: Life expectancy (years)
format: float
- score_name: Greater than or equal to the 90th percentile for low median household income as a percent of area median income, has low HS attainment, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for low median household income as a percent of area median income, has low HS attainment, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS attainment?
label: Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS attainment?
format: bool
- score_name: Low median household income as a percent of area median income (percentile)
label: Low median household income as a percent of area median income (percentile)
@ -255,8 +255,8 @@ sheets:
- score_name: Median household income as a percent of area median income
label: Median household income as a percent of area median income
format: percentage
- score_name: Greater than or equal to the 90th percentile for households in linguistic isolation, has low HS attainment, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for households in linguistic isolation, has low HS attainment, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for households in linguistic isolation and has low HS attainment?
label: Greater than or equal to the 90th percentile for households in linguistic isolation and has low HS attainment?
format: bool
- score_name: Linguistic isolation (percent) (percentile)
label: Linguistic isolation (percent) (percentile)
@ -264,8 +264,8 @@ sheets:
- score_name: Linguistic isolation (percent)
label: Linguistic isolation (percent)
format: percentage
- score_name: Greater than or equal to the 90th percentile for unemployment, has low HS attainment, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for unemployment, has low HS attainment, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for unemployment and has low HS attainment?
label: Greater than or equal to the 90th percentile for unemployment and has low HS attainment?
format: bool
- score_name: Unemployment (percent) (percentile)
label: Unemployment (percent) (percentile)
@ -273,8 +273,8 @@ sheets:
- score_name: Unemployment (percent)
label: Unemployment (percent)
format: percentage
- score_name: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level, has low HS attainment, and has a low percent of higher ed students?
label: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level, has low HS attainment, and high percent of residents that are not higher ed students?
- score_name: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level and has low HS attainment?
label: Greater than or equal to the 90th percentile for households at or below 100% federal poverty level and has low HS attainment?
format: bool
- score_name: Percent of individuals below 200% Federal Poverty Line (percentile)
label: Percent of individuals below 200% Federal Poverty Line (percentile)

View file

@ -0,0 +1,798 @@
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "cf8f39b0-7735-4f7c-9178-61bbf2257951",
"metadata": {},
"outputs": [],
"source": [
"import pandas as pd\n",
"import numpy as np\n",
"\n",
"%load_ext lab_black"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "66639c20-be5e-4bf6-9b58-98338874f7cc",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"'Median value ($) of owner-occupied housing units (percentile)'"
]
},
"execution_count": 2,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"check = pd.read_csv(\n",
" \"/Users/emmausds/j40/data_pipeline/data/score/downloadable/codebook.csv\"\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "5e525e4e-6764-4d4d-9119-b4d400ba022f",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>score_name</th>\n",
" <th>csv_field_type</th>\n",
" <th>csv_label</th>\n",
" <th>excel_label</th>\n",
" <th>calculation_notes</th>\n",
" <th>threshold_category</th>\n",
" <th>notes</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>GEOID10_TRACT</td>\n",
" <td>string</td>\n",
" <td>Census tract ID</td>\n",
" <td>Census tract ID</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>County Name</td>\n",
" <td>string</td>\n",
" <td>County Name</td>\n",
" <td>County Name</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>State/Territory</td>\n",
" <td>string</td>\n",
" <td>State/Territory</td>\n",
" <td>State/Territory</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>Total threshold criteria exceeded</td>\n",
" <td>int64</td>\n",
" <td>Total threshold criteria exceeded</td>\n",
" <td>Total threshold criteria exceeded</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Lists out the total number of criteria (where ...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>Definition M (communities)</td>\n",
" <td>bool</td>\n",
" <td>Identified as disadvantaged</td>\n",
" <td>Identified as disadvantaged</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>True / False variable for whether a tract is a...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>77</th>\n",
" <td>Percentage households below 100% of federal po...</td>\n",
" <td>percentage</td>\n",
" <td>Percentage households below 100% of federal po...</td>\n",
" <td>Percentage households below 100% of federal po...</td>\n",
" <td>Because not all data is available for the Nati...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>78</th>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>bool</td>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>Because not all data is available for the Nati...</td>\n",
" <td>training and workforce development</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>79</th>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>bool</td>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>Because not all data is available for the Nati...</td>\n",
" <td>training and workforce development</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>80</th>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>bool</td>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>Because not all data is available for the Nati...</td>\n",
" <td>training and workforce development</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>81</th>\n",
" <td>Percent of population not currently enrolled i...</td>\n",
" <td>percentage</td>\n",
" <td>Percent of residents who are not currently enr...</td>\n",
" <td>Percent of residents who are not currently enr...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>82 rows × 7 columns</p>\n",
"</div>"
],
"text/plain": [
" score_name csv_field_type \\\n",
"0 GEOID10_TRACT string \n",
"1 County Name string \n",
"2 State/Territory string \n",
"3 Total threshold criteria exceeded int64 \n",
"4 Definition M (communities) bool \n",
".. ... ... \n",
"77 Percentage households below 100% of federal po... percentage \n",
"78 Greater than or equal to the 90th percentile f... bool \n",
"79 Greater than or equal to the 90th percentile f... bool \n",
"80 Greater than or equal to the 90th percentile f... bool \n",
"81 Percent of population not currently enrolled i... percentage \n",
"\n",
" csv_label \\\n",
"0 Census tract ID \n",
"1 County Name \n",
"2 State/Territory \n",
"3 Total threshold criteria exceeded \n",
"4 Identified as disadvantaged \n",
".. ... \n",
"77 Percentage households below 100% of federal po... \n",
"78 Greater than or equal to the 90th percentile f... \n",
"79 Greater than or equal to the 90th percentile f... \n",
"80 Greater than or equal to the 90th percentile f... \n",
"81 Percent of residents who are not currently enr... \n",
"\n",
" excel_label \\\n",
"0 Census tract ID \n",
"1 County Name \n",
"2 State/Territory \n",
"3 Total threshold criteria exceeded \n",
"4 Identified as disadvantaged \n",
".. ... \n",
"77 Percentage households below 100% of federal po... \n",
"78 Greater than or equal to the 90th percentile f... \n",
"79 Greater than or equal to the 90th percentile f... \n",
"80 Greater than or equal to the 90th percentile f... \n",
"81 Percent of residents who are not currently enr... \n",
"\n",
" calculation_notes \\\n",
"0 NaN \n",
"1 NaN \n",
"2 NaN \n",
"3 NaN \n",
"4 NaN \n",
".. ... \n",
"77 Because not all data is available for the Nati... \n",
"78 Because not all data is available for the Nati... \n",
"79 Because not all data is available for the Nati... \n",
"80 Because not all data is available for the Nati... \n",
"81 NaN \n",
"\n",
" threshold_category \\\n",
"0 NaN \n",
"1 NaN \n",
"2 NaN \n",
"3 NaN \n",
"4 NaN \n",
".. ... \n",
"77 NaN \n",
"78 training and workforce development \n",
"79 training and workforce development \n",
"80 training and workforce development \n",
"81 NaN \n",
"\n",
" notes \n",
"0 NaN \n",
"1 NaN \n",
"2 NaN \n",
"3 Lists out the total number of criteria (where ... \n",
"4 True / False variable for whether a tract is a... \n",
".. ... \n",
"77 NaN \n",
"78 NaN \n",
"79 NaN \n",
"80 NaN \n",
"81 NaN \n",
"\n",
"[82 rows x 7 columns]"
]
},
"execution_count": 3,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"check"
]
},
{
"cell_type": "code",
"execution_count": 28,
"id": "d86c867a-1a55-4ec0-82a6-040841406236",
"metadata": {},
"outputs": [],
"source": [
"codebook = pd.DataFrame(to_frame_dict)"
]
},
{
"cell_type": "code",
"execution_count": 62,
"id": "6215deaf-b004-4da0-a70b-bc54f636601a",
"metadata": {},
"outputs": [],
"source": [
"details_to_merge = pd.DataFrame(mapping_dictionary)"
]
},
{
"cell_type": "code",
"execution_count": 69,
"id": "ac4e65c2-09e6-4978-9440-37b3be057f65",
"metadata": {},
"outputs": [],
"source": [
"shapefile_codes = pd.read_csv(\n",
" \"/Users/emmausds/j40/data_pipeline/data/score/shapefile/columns.csv\"\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 153,
"id": "31cfd9ec-5f5f-4642-a51f-6875c2c279a4",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"['Expected agricultural loss rate (Natural Hazards Risk Index) (percentile)',\n",
" 'Expected building loss rate (Natural Hazards Risk Index) (percentile)',\n",
" 'Expected population loss rate (Natural Hazards Risk Index) (percentile)',\n",
" 'Energy burden (percentile)',\n",
" 'PM2.5 in the air (percentile)',\n",
" 'Diesel particulate matter exposure (percentile)',\n",
" 'Traffic proximity and volume (percentile)',\n",
" 'Housing burden (percent) (percentile)',\n",
" 'Percent pre-1960s housing (lead paint indicator) (percentile)',\n",
" 'Median value ($) of owner-occupied housing units (percentile)',\n",
" 'Proximity to hazardous waste sites (percentile)',\n",
" 'Proximity to NPL sites (percentile)',\n",
" 'Proximity to Risk Management Plan (RMP) facilities (percentile)',\n",
" 'Wastewater discharge (percentile)',\n",
" 'Current asthma among adults aged greater than or equal to 18 years (percentile)',\n",
" 'Diagnosed diabetes among adults aged greater than or equal to 18 years (percentile)',\n",
" 'Coronary heart disease among adults aged greater than or equal to 18 years (percentile)',\n",
" 'Low life expectancy (percentile)',\n",
" 'Low median household income as a percent of area median income (percentile)',\n",
" 'Linguistic isolation (percent) (percentile)',\n",
" 'Unemployment (percent) (percentile)',\n",
" 'Percent of individuals below 200% Federal Poverty Line (percentile)',\n",
" 'Percent of individuals < 100% Federal Poverty Line (percentile)',\n",
" 'Percent individuals age 25 or over with less than high school degree (percentile)',\n",
" 'Definition M (percentile)',\n",
" 'Low median household income as a percent of territory median income in 2009 (percentile)',\n",
" 'Percentage households below 100% of federal poverty line in 2009 for island areas (percentile)',\n",
" 'Unemployment (percent) in 2009 for island areas (percentile)']"
]
},
"execution_count": 153,
"metadata": {},
"output_type": "execute_result"
}
],
"source": []
},
{
"cell_type": "code",
"execution_count": 154,
"id": "66dde4fc-48e6-4bdf-b3a6-16c766e94d8a",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
" - column_name: Expected agricultural loss rate (Natural Hazards Risk Index) (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Expected building loss rate (Natural Hazards Risk Index) (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Expected population loss rate (Natural Hazards Risk Index) (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Energy burden (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: PM2.5 in the air (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Diesel particulate matter exposure (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Traffic proximity and volume (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Housing burden (percent) (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Percent pre-1960s housing (lead paint indicator) (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Median value ($) of owner-occupied housing units (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Proximity to hazardous waste sites (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Proximity to NPL sites (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Proximity to Risk Management Plan (RMP) facilities (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Wastewater discharge (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Current asthma among adults aged greater than or equal to 18 years (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Diagnosed diabetes among adults aged greater than or equal to 18 years (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Coronary heart disease among adults aged greater than or equal to 18 years (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Low life expectancy (percentile)\n",
" notes: (1) this percentile is reversed, meaning the lowest raw numbers become the highest percentiles, and (2) all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Low median household income as a percent of area median income (percentile)\n",
" notes: (1) this percentile is reversed, meaning the lowest raw numbers become the highest percentiles, and (2) all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Linguistic isolation (percent) (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Unemployment (percent) (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Percent of individuals below 200% Federal Poverty Line (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Percent of individuals < 100% Federal Poverty Line (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Percent individuals age 25 or over with less than high school degree (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Definition M (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Low median household income as a percent of territory median income in 2009 (percentile)\n",
" notes: (1) this percentile is reversed, meaning the lowest raw numbers become the highest percentiles, and (2) all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Percentage households below 100% of federal poverty line in 2009 for island areas (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n",
" - column_name: Unemployment (percent) in 2009 for island areas (percentile)\n",
" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\n"
]
}
],
"source": [
"for col in [col for col in download_codebook.index.to_list() if \"(percentile)\" in col]:\n",
" print(f\" - column_name: {col}\")\n",
" if \"Low\" not in col:\n",
" print(\n",
" f\" notes: all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\"\n",
" )\n",
" else:\n",
" print(\n",
" f\" notes: (1) this percentile is reversed, meaning the lowest raw numbers become the highest percentiles, and (2) all percentiles are floored (rounded down to the nearest percentile). For example, 89.7th percentile is rounded down to 89 for this field.\"\n",
" )"
]
},
{
"cell_type": "code",
"execution_count": 143,
"id": "5c08708e-4ebf-4cfe-8efb-7ee6c7930427",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>excel_label</th>\n",
" <th>format</th>\n",
" <th>shapefile_column</th>\n",
" <th>notes</th>\n",
" <th>category</th>\n",
" </tr>\n",
" <tr>\n",
" <th>score_name</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>GEOID10_TRACT</th>\n",
" <td>Census tract ID</td>\n",
" <td>string</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>County Name</th>\n",
" <td>County Name</td>\n",
" <td>string</td>\n",
" <td>CF</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>State/Territory</th>\n",
" <td>State/Territory</td>\n",
" <td>string</td>\n",
" <td>SF</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Total threshold criteria exceeded</th>\n",
" <td>Total threshold criteria exceeded</td>\n",
" <td>int64</td>\n",
" <td>TC</td>\n",
" <td>Lists out the total number of criteria (where ...</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Definition M (communities)</th>\n",
" <td>Identified as disadvantaged</td>\n",
" <td>bool</td>\n",
" <td>SM_C</td>\n",
" <td>True / False variable for whether a tract is a...</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Unemployment (percent) in 2009 (island areas) and 2010 (states and PR)</th>\n",
" <td>Unemployment (percent) in 2009 (island areas) ...</td>\n",
" <td>percentage</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Percentage households below 100% of federal poverty line in 2009 (island areas) and 2010 (states and PR)</th>\n",
" <td>Percentage households below 100% of federal po...</td>\n",
" <td>percentage</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Greater than or equal to the 90th percentile for unemployment and has low HS education in 2009 (island areas)?</th>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>bool</td>\n",
" <td>IAULHSE</td>\n",
" <td>island area information comes from the dicenni...</td>\n",
" <td>training and workforce development</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Greater than or equal to the 90th percentile for households at or below 100% federal poverty level and has low HS education in 2009 (island areas)?</th>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>bool</td>\n",
" <td>IAPLHSE</td>\n",
" <td>island area information comes from the dicenni...</td>\n",
" <td>training and workforce development</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Greater than or equal to the 90th percentile for low median household income as a percent of area median income and has low HS education in 2009 (island areas)?</th>\n",
" <td>Greater than or equal to the 90th percentile f...</td>\n",
" <td>bool</td>\n",
" <td>IALMILHSE</td>\n",
" <td>island area information comes from the dicenni...</td>\n",
" <td>training and workforce development</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>82 rows × 5 columns</p>\n",
"</div>"
],
"text/plain": [
" excel_label \\\n",
"score_name \n",
"GEOID10_TRACT Census tract ID \n",
"County Name County Name \n",
"State/Territory State/Territory \n",
"Total threshold criteria exceeded Total threshold criteria exceeded \n",
"Definition M (communities) Identified as disadvantaged \n",
"... ... \n",
"Unemployment (percent) in 2009 (island areas) a... Unemployment (percent) in 2009 (island areas) ... \n",
"Percentage households below 100% of federal pov... Percentage households below 100% of federal po... \n",
"Greater than or equal to the 90th percentile fo... Greater than or equal to the 90th percentile f... \n",
"Greater than or equal to the 90th percentile fo... Greater than or equal to the 90th percentile f... \n",
"Greater than or equal to the 90th percentile fo... Greater than or equal to the 90th percentile f... \n",
"\n",
" format \\\n",
"score_name \n",
"GEOID10_TRACT string \n",
"County Name string \n",
"State/Territory string \n",
"Total threshold criteria exceeded int64 \n",
"Definition M (communities) bool \n",
"... ... \n",
"Unemployment (percent) in 2009 (island areas) a... percentage \n",
"Percentage households below 100% of federal pov... percentage \n",
"Greater than or equal to the 90th percentile fo... bool \n",
"Greater than or equal to the 90th percentile fo... bool \n",
"Greater than or equal to the 90th percentile fo... bool \n",
"\n",
" shapefile_column \\\n",
"score_name \n",
"GEOID10_TRACT NaN \n",
"County Name CF \n",
"State/Territory SF \n",
"Total threshold criteria exceeded TC \n",
"Definition M (communities) SM_C \n",
"... ... \n",
"Unemployment (percent) in 2009 (island areas) a... NaN \n",
"Percentage households below 100% of federal pov... NaN \n",
"Greater than or equal to the 90th percentile fo... IAULHSE \n",
"Greater than or equal to the 90th percentile fo... IAPLHSE \n",
"Greater than or equal to the 90th percentile fo... IALMILHSE \n",
"\n",
" notes \\\n",
"score_name \n",
"GEOID10_TRACT NaN \n",
"County Name NaN \n",
"State/Territory NaN \n",
"Total threshold criteria exceeded Lists out the total number of criteria (where ... \n",
"Definition M (communities) True / False variable for whether a tract is a... \n",
"... ... \n",
"Unemployment (percent) in 2009 (island areas) a... NaN \n",
"Percentage households below 100% of federal pov... NaN \n",
"Greater than or equal to the 90th percentile fo... island area information comes from the dicenni... \n",
"Greater than or equal to the 90th percentile fo... island area information comes from the dicenni... \n",
"Greater than or equal to the 90th percentile fo... island area information comes from the dicenni... \n",
"\n",
" category \n",
"score_name \n",
"GEOID10_TRACT NaN \n",
"County Name NaN \n",
"State/Territory NaN \n",
"Total threshold criteria exceeded NaN \n",
"Definition M (communities) NaN \n",
"... ... \n",
"Unemployment (percent) in 2009 (island areas) a... NaN \n",
"Percentage households below 100% of federal pov... NaN \n",
"Greater than or equal to the 90th percentile fo... training and workforce development \n",
"Greater than or equal to the 90th percentile fo... training and workforce development \n",
"Greater than or equal to the 90th percentile fo... training and workforce development \n",
"\n",
"[82 rows x 5 columns]"
]
},
"execution_count": 143,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"download_codebook.dropna(subset=[\"format\"]).reset_index()[\"score_name\"]"
]
},
{
"cell_type": "code",
"execution_count": 137,
"id": "7139ce5d-db5e-49dd-8bb3-122c7b73b395",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>excel_label</th>\n",
" <th>format</th>\n",
" <th>shapefile_column</th>\n",
" <th>notes</th>\n",
" <th>category</th>\n",
" </tr>\n",
" <tr>\n",
" <th>score_name</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
"Empty DataFrame\n",
"Columns: [excel_label, format, shapefile_column, notes, category]\n",
"Index: []"
]
},
"execution_count": 137,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"download_codebook.loc[\n",
" sum([download_codebook[col] == \"percentile\" for col in [\"format\"]]) > 0\n",
"]"
]
},
{
"cell_type": "code",
"execution_count": 134,
"id": "e31ef01c-b225-48f0-bdf5-1efb8d4ed95c",
"metadata": {},
"outputs": [
{
"ename": "ValueError",
"evalue": "Cannot index with multidimensional key",
"output_type": "error",
"traceback": [
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
"\u001b[0;31mValueError\u001b[0m Traceback (most recent call last)",
"Input \u001b[0;32mIn [134]\u001b[0m, in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0m \u001b[43mdownload_codebook\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mloc\u001b[49m\u001b[43m[\u001b[49m\u001b[43mdownload_codebook\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mfilter\u001b[49m\u001b[43m(\u001b[49m\u001b[43mlike\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43mformat\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m)\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m==\u001b[39;49m\u001b[43m \u001b[49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43mpercentile\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m]\u001b[49m\n",
"File \u001b[0;32m/usr/local/lib/python3.9/site-packages/pandas/core/indexing.py:931\u001b[0m, in \u001b[0;36m_LocationIndexer.__getitem__\u001b[0;34m(self, key)\u001b[0m\n\u001b[1;32m 928\u001b[0m axis \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39maxis \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;241m0\u001b[39m\n\u001b[1;32m 930\u001b[0m maybe_callable \u001b[38;5;241m=\u001b[39m com\u001b[38;5;241m.\u001b[39mapply_if_callable(key, \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mobj)\n\u001b[0;32m--> 931\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_getitem_axis\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmaybe_callable\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43maxis\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43maxis\u001b[49m\u001b[43m)\u001b[49m\n",
"File \u001b[0;32m/usr/local/lib/python3.9/site-packages/pandas/core/indexing.py:1151\u001b[0m, in \u001b[0;36m_LocIndexer._getitem_axis\u001b[0;34m(self, key, axis)\u001b[0m\n\u001b[1;32m 1148\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m (\u001b[38;5;28misinstance\u001b[39m(key, \u001b[38;5;28mtuple\u001b[39m) \u001b[38;5;129;01mand\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(labels, MultiIndex)):\n\u001b[1;32m 1150\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mhasattr\u001b[39m(key, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mndim\u001b[39m\u001b[38;5;124m\"\u001b[39m) \u001b[38;5;129;01mand\u001b[39;00m key\u001b[38;5;241m.\u001b[39mndim \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m1\u001b[39m:\n\u001b[0;32m-> 1151\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mCannot index with multidimensional key\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 1153\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_getitem_iterable(key, axis\u001b[38;5;241m=\u001b[39maxis)\n\u001b[1;32m 1155\u001b[0m \u001b[38;5;66;03m# nested tuple slicing\u001b[39;00m\n",
"\u001b[0;31mValueError\u001b[0m: Cannot index with multidimensional key"
]
}
],
"source": [
"download_codebook.loc[download_codebook.filter(like=\"format\") == \"percentile\"]"
]
},
{
"cell_type": "code",
"execution_count": 131,
"id": "73268de4-3378-4ac7-bf85-f483a78c3966",
"metadata": {},
"outputs": [],
"source": [
"download_codebook = pd.concat(\n",
" [\n",
" codebook.set_index(\"score_name\"),\n",
" shapefile_codes.rename(\n",
" columns={\"meaning\": \"shapefile_column\", \"column\": \"score_name\"}\n",
" ).set_index(\"score_name\"),\n",
" details_to_merge.set_index(\"score_name\"),\n",
" ],\n",
" axis=1,\n",
")"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "6321ed42-aee6-40fc-8bf8-2a4ce4276eca",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.10"
}
},
"nbformat": 4,
"nbformat_minor": 5
}

View file

@ -198,42 +198,42 @@ TILES_SCORE_COLUMNS = {
field_names.WASTEWATER_FIELD
+ field_names.PERCENTILE_FIELD_SUFFIX: "WF_PFS",
field_names.UST_FIELD + field_names.PERCENTILE_FIELD_SUFFIX: "UST_PFS",
field_names.M_WATER: "M_WTR",
field_names.M_WORKFORCE: "M_WKFC",
field_names.M_CLIMATE: "M_CLT",
field_names.M_ENERGY: "M_ENY",
field_names.M_TRANSPORTATION: "M_TRN",
field_names.M_HOUSING: "M_HSG",
field_names.M_POLLUTION: "M_PLN",
field_names.M_HEALTH: "M_HLTH",
field_names.N_WATER: "N_WTR",
field_names.N_WORKFORCE: "N_WKFC",
field_names.N_CLIMATE: "N_CLT",
field_names.N_ENERGY: "N_ENY",
field_names.N_TRANSPORTATION: "N_TRN",
field_names.N_HOUSING: "N_HSG",
field_names.N_POLLUTION: "N_PLN",
field_names.N_HEALTH: "N_HLTH",
# temporarily update this so that it's the Narwhal score that gets visualized on the map
# The NEW final score value INCLUDES the adjacency index.
field_names.FINAL_SCORE_N_BOOLEAN: "SM_C",
field_names.FINAL_SCORE_N_BOOLEAN: "SN_C",
field_names.SCORE_N_COMMUNITIES
+ field_names.ADJACENT_MEAN_SUFFIX: "SM_DON",
field_names.SCORE_N_COMMUNITIES: "SM_NO_DON",
field_names.EXPECTED_POPULATION_LOSS_RATE_LOW_INCOME_LOW_HIGHER_ED_FIELD: "EPLRLI",
field_names.EXPECTED_AGRICULTURE_LOSS_RATE_LOW_INCOME_LOW_HIGHER_ED_FIELD: "EALRLI",
field_names.EXPECTED_BUILDING_LOSS_RATE_LOW_INCOME_LOW_HIGHER_ED_FIELD: "EBLRLI",
field_names.PM25_EXPOSURE_LOW_INCOME_LOW_HIGHER_ED_FIELD: "PM25LI",
field_names.ENERGY_BURDEN_LOW_INCOME_LOW_HIGHER_ED_FIELD: "EBLI",
field_names.DIESEL_PARTICULATE_MATTER_LOW_INCOME_LOW_HIGHER_ED_FIELD: "DPMLI",
field_names.TRAFFIC_PROXIMITY_LOW_INCOME_LOW_HIGHER_ED_FIELD: "TPLI",
field_names.LEAD_PAINT_MEDIAN_HOUSE_VALUE_LOW_INCOME_LOW_HIGHER_ED_FIELD: "LPMHVLI",
field_names.HOUSING_BURDEN_LOW_INCOME_LOW_HIGHER_ED_FIELD: "HBLI",
field_names.RMP_LOW_INCOME_LOW_HIGHER_ED_FIELD: "RMPLI",
field_names.SUPERFUND_LOW_INCOME_LOW_HIGHER_ED_FIELD: "SFLI",
field_names.HAZARDOUS_WASTE_LOW_INCOME_LOW_HIGHER_ED_FIELD: "HWLI",
field_names.WASTEWATER_DISCHARGE_LOW_INCOME_LOW_HIGHER_ED_FIELD: "WDLI",
+ field_names.ADJACENT_MEAN_SUFFIX: "SN_DON",
field_names.SCORE_N_COMMUNITIES: "SN_NO_DON",
field_names.EXPECTED_POPULATION_LOSS_RATE_LOW_INCOME_FIELD: "EPLRLI",
field_names.EXPECTED_AGRICULTURE_LOSS_RATE_LOW_INCOME_FIELD: "EALRLI",
field_names.EXPECTED_BUILDING_LOSS_RATE_LOW_INCOME_FIELD: "EBLRLI",
field_names.PM25_EXPOSURE_LOW_INCOME_FIELD: "PM25LI",
field_names.ENERGY_BURDEN_LOW_INCOME_FIELD: "EBLI",
field_names.DIESEL_PARTICULATE_MATTER_LOW_INCOME_FIELD: "DPMLI",
field_names.TRAFFIC_PROXIMITY_LOW_INCOME_FIELD: "TPLI",
field_names.LEAD_PAINT_MEDIAN_HOUSE_VALUE_LOW_INCOME_FIELD: "LPMHVLI",
field_names.HOUSING_BURDEN_LOW_INCOME_FIELD: "HBLI",
field_names.RMP_LOW_INCOME_FIELD: "RMPLI",
field_names.SUPERFUND_LOW_INCOME_FIELD: "SFLI",
field_names.HAZARDOUS_WASTE_LOW_INCOME_FIELD: "HWLI",
field_names.WASTEWATER_DISCHARGE_LOW_INCOME_FIELD: "WDLI",
field_names.UST_LOW_INCOME_FIELD: "USTLI",
field_names.DIABETES_LOW_INCOME_LOW_HIGHER_ED_FIELD: "DLI",
field_names.ASTHMA_LOW_INCOME_LOW_HIGHER_ED_FIELD: "ALI",
field_names.HEART_DISEASE_LOW_INCOME_LOW_HIGHER_ED_FIELD: "HDLI",
field_names.LOW_LIFE_EXPECTANCY_LOW_INCOME_LOW_HIGHER_ED_FIELD: "LLELI",
field_names.LINGUISTIC_ISOLATION_LOW_HS_LOW_HIGHER_ED_FIELD: "LILHSE",
field_names.POVERTY_LOW_HS_LOW_HIGHER_ED_FIELD: "PLHSE",
field_names.LOW_MEDIAN_INCOME_LOW_HS_LOW_HIGHER_ED_FIELD: "LMILHSE",
field_names.UNEMPLOYMENT_LOW_HS_LOW_HIGHER_ED_FIELD: "ULHSE",
field_names.DIABETES_LOW_INCOME_FIELD: "DLI",
field_names.ASTHMA_LOW_INCOME_FIELD: "ALI",
field_names.HEART_DISEASE_LOW_INCOME_FIELD: "HDLI",
field_names.LOW_LIFE_EXPECTANCY_LOW_INCOME_FIELD: "LLELI",
field_names.LINGUISTIC_ISOLATION_LOW_HS_EDUCATION_FIELD: "LILHSE",
field_names.POVERTY_LOW_HS_EDUCATION_FIELD: "PLHSE",
field_names.LOW_MEDIAN_INCOME_LOW_HS_EDUCATION_FIELD: "LMILHSE",
field_names.UNEMPLOYMENT_LOW_HS_EDUCATION_FIELD: "ULHSE",
# new booleans only for the environmental factors
field_names.EXPECTED_POPULATION_LOSS_EXCEEDS_PCTILE_THRESHOLD: "EPL_ET",
field_names.EXPECTED_AGRICULTURAL_LOSS_EXCEEDS_PCTILE_THRESHOLD: "EAL_ET",
@ -276,28 +276,24 @@ TILES_SCORE_COLUMNS = {
field_names.CENSUS_DECENNIAL_UNEMPLOYMENT_FIELD_2009
+ field_names.ISLAND_AREAS_PERCENTILE_ADJUSTMENT_FIELD
+ field_names.PERCENTILE_FIELD_SUFFIX: "IAULHSE_PFS",
field_names.LOW_HS_EDUCATION_LOW_HIGHER_ED_FIELD: "LHE",
field_names.LOW_HS_EDUCATION_FIELD: "LHE",
field_names.ISLAND_AREAS_LOW_HS_EDUCATION_FIELD: "IALHE",
# Percentage of HS Degree completion for Islands
field_names.CENSUS_DECENNIAL_HIGH_SCHOOL_ED_FIELD_2009: "IAHSEF",
field_names.COLLEGE_ATTENDANCE_FIELD: "CA",
field_names.COLLEGE_NON_ATTENDANCE_FIELD: "NCA",
# This is logically equivalent to "non-college greater than 80%"
field_names.COLLEGE_ATTENDANCE_LESS_THAN_20_FIELD: "CA_LT20",
# Booleans for the front end about the types of thresholds exceeded
field_names.CLIMATE_THRESHOLD_EXCEEDED: "M_CLT_EOMI",
field_names.ENERGY_THRESHOLD_EXCEEDED: "M_ENY_EOMI",
field_names.TRAFFIC_THRESHOLD_EXCEEDED: "M_TRN_EOMI",
field_names.HOUSING_THREHSOLD_EXCEEDED: "M_HSG_EOMI",
field_names.POLLUTION_THRESHOLD_EXCEEDED: "M_PLN_EOMI",
field_names.WATER_THRESHOLD_EXCEEDED: "M_WTR_EOMI",
field_names.HEALTH_THRESHOLD_EXCEEDED: "M_HLTH_EOMI",
field_names.WORKFORCE_THRESHOLD_EXCEEDED: "M_WKFC_EOMI",
field_names.CLIMATE_THRESHOLD_EXCEEDED: "N_CLT_EOMI",
field_names.ENERGY_THRESHOLD_EXCEEDED: "N_ENY_EOMI",
field_names.TRAFFIC_THRESHOLD_EXCEEDED: "N_TRN_EOMI",
field_names.HOUSING_THREHSOLD_EXCEEDED: "N_HSG_EOMI",
field_names.POLLUTION_THRESHOLD_EXCEEDED: "N_PLN_EOMI",
field_names.WATER_THRESHOLD_EXCEEDED: "N_WTR_EOMI",
field_names.HEALTH_THRESHOLD_EXCEEDED: "N_HLTH_EOMI",
field_names.WORKFORCE_THRESHOLD_EXCEEDED: "N_WKFC_EOMI",
# These are the booleans for socioeconomic indicators
## this measures low income boolean
field_names.FPL_200_SERIES_IMPUTED_AND_ADJUSTED: "FPL200S",
## Low high school for t&wd
field_names.WORKFORCE_SOCIO_INDICATORS_EXCEEDED: "M_WKFC_EBSI",
field_names.WORKFORCE_SOCIO_INDICATORS_EXCEEDED: "N_WKFC_EBSI",
field_names.DOT_BURDEN_PCTILE_THRESHOLD: "TD_ET",
field_names.DOT_TRAVEL_BURDEN_FIELD
+ field_names.PERCENTILE_FIELD_SUFFIX: "TD_PFS",
@ -377,8 +373,6 @@ TILES_SCORE_FLOAT_COLUMNS = [
# Island areas HS degree attainment rate
field_names.CENSUS_DECENNIAL_HIGH_SCHOOL_ED_FIELD_2009,
field_names.WASTEWATER_FIELD + field_names.PERCENTILE_FIELD_SUFFIX,
field_names.COLLEGE_NON_ATTENDANCE_FIELD,
field_names.COLLEGE_ATTENDANCE_FIELD,
field_names.DOT_TRAVEL_BURDEN_FIELD + field_names.PERCENTILE_FIELD_SUFFIX,
field_names.FUTURE_FLOOD_RISK_FIELD + field_names.PERCENTILE_FIELD_SUFFIX,
field_names.FUTURE_WILDFIRE_RISK_FIELD

View file

@ -403,6 +403,7 @@ class ScoreETL(ExtractTransformLoad):
df[field_names.MEDIAN_INCOME_FIELD] / df[field_names.AMI_FIELD]
)
# Donut columns get added later
numeric_columns = [
field_names.HOUSING_BURDEN_FIELD,
field_names.NO_KITCHEN_OR_INDOOR_PLUMBING_FIELD,
@ -477,12 +478,15 @@ class ScoreETL(ExtractTransformLoad):
non_numeric_columns = [
self.GEOID_TRACT_FIELD_NAME,
field_names.PERSISTENT_POVERTY_FIELD,
field_names.HISTORIC_REDLINING_SCORE_EXCEEDED,
field_names.TRACT_ELIGIBLE_FOR_NONNATURAL_THRESHOLD,
field_names.AGRICULTURAL_VALUE_BOOL_FIELD,
field_names.ELIGIBLE_FUDS_BINARY_FIELD_NAME,
]
boolean_columns = [
field_names.AML_BOOLEAN,
field_names.IMPUTED_INCOME_FLAG_FIELD_NAME,
field_names.ELIGIBLE_FUDS_BINARY_FIELD_NAME,
field_names.HISTORIC_REDLINING_SCORE_EXCEEDED,
]
# For some columns, high values are "good", so we want to reverse the percentile
@ -523,6 +527,7 @@ class ScoreETL(ExtractTransformLoad):
non_numeric_columns
+ numeric_columns
+ [rp.field_name for rp in reverse_percentiles]
+ boolean_columns
)
df_copy = df[columns_to_keep].copy()
@ -533,6 +538,10 @@ class ScoreETL(ExtractTransformLoad):
df_copy[numeric_columns] = df_copy[numeric_columns].apply(pd.to_numeric)
# coerce all booleans to bools
for col in boolean_columns:
df_copy[col] = df_copy[col].astype(bool)
# Convert all columns to numeric and do math
# Note that we have a few special conditions here and we handle them explicitly.
# For *Linguistic Isolation*, we do NOT want to include Puerto Rico in the percentile

View file

@ -53,7 +53,7 @@ class GeoScoreETL(ExtractTransformLoad):
self.TARGET_SCORE_SHORT_FIELD = constants.TILES_SCORE_COLUMNS[
field_names.SCORE_N
]
self.TARGET_SCORE_RENAME_TO = "M_SCORE"
self.TARGET_SCORE_RENAME_TO = "SCORE"
# Import the shortened name for tract ("GTF") that's used on the tiles.
self.TRACT_SHORT_FIELD = constants.TILES_SCORE_COLUMNS[

File diff suppressed because one or more lines are too long

View file

@ -1,418 +0,0 @@
{
"cells": [
{
"cell_type": "code",
"execution_count": 54,
"id": "df048f08",
"metadata": {},
"outputs": [],
"source": [
"import geopandas as gpd\n",
"import pathlib"
]
},
{
"cell_type": "code",
"execution_count": 55,
"id": "62366f7d",
"metadata": {},
"outputs": [],
"source": [
"lowJson = pathlib.Path() / 'usa-low.json'\n",
"assert lowJson.exists()\n",
"highJson = pathlib.Path() / 'usa-high.json'\n",
"assert highJson.exists()"
]
},
{
"cell_type": "code",
"execution_count": 50,
"id": "4077ed78",
"metadata": {},
"outputs": [],
"source": [
"gdf = gpd.read_file(highJson)"
]
},
{
"cell_type": "code",
"execution_count": 56,
"id": "d4abfc64",
"metadata": {},
"outputs": [],
"source": [
"gdf['area'] = gdf.apply(lambda row : gpd.GeoSeries(row['geometry']).area, axis = 1)"
]
},
{
"cell_type": "markdown",
"id": "5077d9ef",
"metadata": {},
"source": [
"Add `zlfc` = *zoom level full containment*, This field will indicate the maximum zoom level the user can go up to while still keeping the entire tract in view. Below, we sample a few tracts to get an idea of the relationship between zoom level and area"
]
},
{
"cell_type": "code",
"execution_count": 89,
"id": "a1234574",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>GEOID10</th>\n",
" <th>SF</th>\n",
" <th>CF</th>\n",
" <th>area</th>\n",
" <th>zlfc</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>9846</th>\n",
" <td>02185000200</td>\n",
" <td>Alaska</td>\n",
" <td>North Slope Borough</td>\n",
" <td>53.323702</td>\n",
" <td>4.45</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9937</th>\n",
" <td>02290000100</td>\n",
" <td>Alaska</td>\n",
" <td>Yukon-Koyukuk Census Area</td>\n",
" <td>21.653154</td>\n",
" <td>5.50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9857</th>\n",
" <td>02188000100</td>\n",
" <td>Alaska</td>\n",
" <td>Northwest Arctic Borough</td>\n",
" <td>21.188159</td>\n",
" <td>5.50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9935</th>\n",
" <td>02290000200</td>\n",
" <td>Alaska</td>\n",
" <td>Yukon-Koyukuk Census Area</td>\n",
" <td>20.744770</td>\n",
" <td>5.38</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9934</th>\n",
" <td>02290000300</td>\n",
" <td>Alaska</td>\n",
" <td>Yukon-Koyukuk Census Area</td>\n",
" <td>17.140826</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9936</th>\n",
" <td>02290000400</td>\n",
" <td>Alaska</td>\n",
" <td>Yukon-Koyukuk Census Area</td>\n",
" <td>14.687448</td>\n",
" <td>5.77</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9893</th>\n",
" <td>02180000100</td>\n",
" <td>Alaska</td>\n",
" <td>Nome Census Area</td>\n",
" <td>13.377817</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9847</th>\n",
" <td>02164000100</td>\n",
" <td>Alaska</td>\n",
" <td>Lake and Peninsula Borough</td>\n",
" <td>13.061644</td>\n",
" <td>5.33</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9918</th>\n",
" <td>02261000100</td>\n",
" <td>Alaska</td>\n",
" <td>Valdez-Cordova Census Area</td>\n",
" <td>11.118835</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9945</th>\n",
" <td>02050000100</td>\n",
" <td>Alaska</td>\n",
" <td>Bethel Census Area</td>\n",
" <td>10.951888</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9841</th>\n",
" <td>02270000100</td>\n",
" <td>Alaska</td>\n",
" <td>Wade Hampton Census Area</td>\n",
" <td>8.771806</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9839</th>\n",
" <td>02240000100</td>\n",
" <td>Alaska</td>\n",
" <td>Southeast Fairbanks Census Area</td>\n",
" <td>8.613690</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9843</th>\n",
" <td>02070000100</td>\n",
" <td>Alaska</td>\n",
" <td>Dillingham Census Area</td>\n",
" <td>8.575307</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9947</th>\n",
" <td>02050000300</td>\n",
" <td>Alaska</td>\n",
" <td>Bethel Census Area</td>\n",
" <td>8.408040</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9899</th>\n",
" <td>02170000101</td>\n",
" <td>Alaska</td>\n",
" <td>Matanuska-Susitna Borough</td>\n",
" <td>6.480444</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9944</th>\n",
" <td>02068000100</td>\n",
" <td>Alaska</td>\n",
" <td>Denali Borough</td>\n",
" <td>5.997236</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9836</th>\n",
" <td>02013000100</td>\n",
" <td>Alaska</td>\n",
" <td>Aleutians East Borough</td>\n",
" <td>5.487726</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9921</th>\n",
" <td>02122000100</td>\n",
" <td>Alaska</td>\n",
" <td>Kenai Peninsula Borough</td>\n",
" <td>4.831831</td>\n",
" <td>6.10</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9851</th>\n",
" <td>02150000100</td>\n",
" <td>Alaska</td>\n",
" <td>Kodiak Island Borough</td>\n",
" <td>4.664009</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9850</th>\n",
" <td>02105000300</td>\n",
" <td>Alaska</td>\n",
" <td>Hoonah-Angoon Census Area</td>\n",
" <td>4.305716</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9838</th>\n",
" <td>02016000100</td>\n",
" <td>Alaska</td>\n",
" <td>Aleutians West Census Area</td>\n",
" <td>4.053520</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9917</th>\n",
" <td>02282000100</td>\n",
" <td>Alaska</td>\n",
" <td>Yakutat City and Borough</td>\n",
" <td>3.926182</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9920</th>\n",
" <td>02261000300</td>\n",
" <td>Alaska</td>\n",
" <td>Valdez-Cordova Census Area</td>\n",
" <td>3.285482</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9840</th>\n",
" <td>02240000400</td>\n",
" <td>Alaska</td>\n",
" <td>Southeast Fairbanks Census Area</td>\n",
" <td>3.233961</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9919</th>\n",
" <td>02261000200</td>\n",
" <td>Alaska</td>\n",
" <td>Valdez-Cordova Census Area</td>\n",
" <td>3.156317</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10354</th>\n",
" <td>41045970900</td>\n",
" <td>Oregon</td>\n",
" <td>Malheur County</td>\n",
" <td>2.731719</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9888</th>\n",
" <td>02198000100</td>\n",
" <td>Alaska</td>\n",
" <td>Prince of Wales-Hyder Census Area</td>\n",
" <td>2.606286</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10212</th>\n",
" <td>41025960200</td>\n",
" <td>Oregon</td>\n",
" <td>Harney County</td>\n",
" <td>2.568943</td>\n",
" <td>7.08</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9844</th>\n",
" <td>02185000300</td>\n",
" <td>Alaska</td>\n",
" <td>North Slope Borough</td>\n",
" <td>2.463165</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9858</th>\n",
" <td>02130000100</td>\n",
" <td>Alaska</td>\n",
" <td>Ketchikan Gateway Borough</td>\n",
" <td>2.440051</td>\n",
" <td>0.00</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" GEOID10 SF CF area zlfc\n",
"9846 02185000200 Alaska North Slope Borough 53.323702 4.45\n",
"9937 02290000100 Alaska Yukon-Koyukuk Census Area 21.653154 5.50\n",
"9857 02188000100 Alaska Northwest Arctic Borough 21.188159 5.50\n",
"9935 02290000200 Alaska Yukon-Koyukuk Census Area 20.744770 5.38\n",
"9934 02290000300 Alaska Yukon-Koyukuk Census Area 17.140826 0.00\n",
"9936 02290000400 Alaska Yukon-Koyukuk Census Area 14.687448 5.77\n",
"9893 02180000100 Alaska Nome Census Area 13.377817 0.00\n",
"9847 02164000100 Alaska Lake and Peninsula Borough 13.061644 5.33\n",
"9918 02261000100 Alaska Valdez-Cordova Census Area 11.118835 0.00\n",
"9945 02050000100 Alaska Bethel Census Area 10.951888 0.00\n",
"9841 02270000100 Alaska Wade Hampton Census Area 8.771806 0.00\n",
"9839 02240000100 Alaska Southeast Fairbanks Census Area 8.613690 0.00\n",
"9843 02070000100 Alaska Dillingham Census Area 8.575307 0.00\n",
"9947 02050000300 Alaska Bethel Census Area 8.408040 0.00\n",
"9899 02170000101 Alaska Matanuska-Susitna Borough 6.480444 0.00\n",
"9944 02068000100 Alaska Denali Borough 5.997236 0.00\n",
"9836 02013000100 Alaska Aleutians East Borough 5.487726 0.00\n",
"9921 02122000100 Alaska Kenai Peninsula Borough 4.831831 6.10\n",
"9851 02150000100 Alaska Kodiak Island Borough 4.664009 0.00\n",
"9850 02105000300 Alaska Hoonah-Angoon Census Area 4.305716 0.00\n",
"9838 02016000100 Alaska Aleutians West Census Area 4.053520 0.00\n",
"9917 02282000100 Alaska Yakutat City and Borough 3.926182 0.00\n",
"9920 02261000300 Alaska Valdez-Cordova Census Area 3.285482 0.00\n",
"9840 02240000400 Alaska Southeast Fairbanks Census Area 3.233961 0.00\n",
"9919 02261000200 Alaska Valdez-Cordova Census Area 3.156317 0.00\n",
"10354 41045970900 Oregon Malheur County 2.731719 0.00\n",
"9888 02198000100 Alaska Prince of Wales-Hyder Census Area 2.606286 0.00\n",
"10212 41025960200 Oregon Harney County 2.568943 7.08\n",
"9844 02185000300 Alaska North Slope Borough 2.463165 0.00\n",
"9858 02130000100 Alaska Ketchikan Gateway Borough 2.440051 0.00"
]
},
"execution_count": 89,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"gdf['zlfc'] = 0\n",
"gdf.at[9846, 'zlfc'] = 4.45\n",
"gdf.at[10212, 'zlfc'] = 7.08\n",
"gdf.at[9937, 'zlfc'] = 5.5\n",
"gdf.at[9857, 'zlfc'] = 5.5\n",
"gdf.at[9935, 'zlfc'] = 5.38\n",
"gdf.at[9936, 'zlfc'] = 5.77\n",
"gdf.at[9921, 'zlfc'] = 6.1\n",
"gdf.at[9847, 'zlfc'] = 5.33\n",
"gdf_short = gdf[[\"GEOID10\", \"SF\", \"CF\", \"area\", \"zlfc\"]]\n",
"gdf_short_sorted = gdf_short.sort_values(by='area', ascending=False);\n",
"gdf_short_sorted.head(30)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "5930de0e",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.13"
}
},
"nbformat": 4,
"nbformat_minor": 5
}

View file

@ -150,7 +150,7 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.6"
"version": "3.9.10"
}
},
"nbformat": 4,

View file

@ -9,23 +9,6 @@ GEOID_TRACT_FIELD = "GEOID10_TRACT"
STATE_FIELD = "State/Territory"
COUNTY_FIELD = "County Name"
# Score file field names
# Definition M fields
SCORE_M = "Definition M"
FINAL_SCORE_N_BOOLEAN = (
"Definition M community, including adjacency index tracts"
)
SCORE_M_COMMUNITIES = "Definition M (communities)"
M_CLIMATE = "Climate Factor (Definition M)"
M_ENERGY = "Energy Factor (Definition M)"
M_TRANSPORTATION = "Transportation Factor (Definition M)"
M_HOUSING = "Housing Factor (Definition M)"
M_POLLUTION = "Pollution Factor (Definition M)"
M_WATER = "Water Factor (Definition M)"
M_HEALTH = "Health Factor (Definition M)"
M_WORKFORCE = "Workforce Factor (Definition M)"
M_NON_WORKFORCE = "Any Non-Workforce Factor (Definition M)"
# Definition Narwhal fields
SCORE_N = "Definition N (communities)"
SCORE_N_COMMUNITIES = "Definition N (communities)"
@ -38,6 +21,9 @@ N_WATER = "Water Factor (Definition N)"
N_HEALTH = "Health Factor (Definition N)"
N_WORKFORCE = "Workforce Factor (Definition N)"
N_NON_WORKFORCE = "Any Non-Workforce Factor (Definition N)"
FINAL_SCORE_N_BOOLEAN = (
"Definition N community, including adjacency index tracts"
)
PERCENTILE = 90
MEDIAN_HOUSE_VALUE_PERCENTILE = 90
@ -545,22 +531,22 @@ LOW_LIFE_EXPECTANCY_LOW_INCOME_LOW_HIGHER_ED_FIELD = (
# Workforce
UNEMPLOYMENT_LOW_HS_EDUCATION_FIELD = (
f"Greater than or equal to the {PERCENTILE}th percentile for unemployment"
" and has low HS education?"
" and has low HS attainment?"
)
LINGUISTIC_ISOLATION_LOW_HS_EDUCATION_FIELD = (
f"Greater than or equal to the {PERCENTILE}th percentile for households in linguistic isolation"
" and has low HS education?"
" and has low HS attainment?"
)
POVERTY_LOW_HS_EDUCATION_FIELD = (
f"Greater than or equal to the {PERCENTILE}th percentile for households at or below 100% federal poverty level"
" and has low HS education?"
" and has low HS attainment?"
)
LOW_MEDIAN_INCOME_LOW_HS_EDUCATION_FIELD = (
f"Greater than or equal to the {PERCENTILE}th percentile for low median household income as a "
f"percent of area median income and has low HS education?"
f"percent of area median income and has low HS attainment?"
)
# Score M Workforce Variables

View file

@ -1,5 +1,4 @@
import pandas as pd
from data_pipeline.score.score_m import ScoreM
from data_pipeline.score.score_narwhal import ScoreNarwhal
from data_pipeline.utils import get_module_logger
@ -13,8 +12,6 @@ class ScoreRunner:
self.df = df
def calculate_scores(self) -> pd.DataFrame:
# Index scores
self.df = ScoreM(df=self.df).add_columns()
self.df = ScoreNarwhal(df=self.df).add_columns()
return self.df