{ "cells": [ { "cell_type": "code", "execution_count": 2, "id": "f0b6f7e2", "metadata": {}, "outputs": [], "source": [ "import geopandas as gpd\n", "import pyogrio\n", "from data_pipeline.etl.sources.census.etl import CensusETL\n", "from data_pipeline.etl.sources.tribal.etl import TribalETL\n", "\n", "import time\n", "\n", "begin = time.time()" ] }, { "cell_type": "code", "execution_count": 3, "id": "1e3e65af", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | tribalId | \n", "landAreaName | \n", "Classification | \n", "geometry | \n", "
---|---|---|---|---|
0 | \n", "LAR0001 | \n", "Cheyenne River LAR | \n", "1 | \n", "MULTIPOLYGON (((-100.49935 45.47125, -100.4993... | \n", "
1 | \n", "LAR0002 | \n", "Crow Creek LAR | \n", "1 | \n", "POLYGON ((-99.42137 44.27733, -99.42138 44.273... | \n", "
2 | \n", "LAR0003 | \n", "Flandreau LAR | \n", "1 | \n", "MULTIPOLYGON (((-96.56655 44.08786, -96.57165 ... | \n", "
3 | \n", "LAR0004 | \n", "Fort Berthold LAR | \n", "1 | \n", "POLYGON ((-102.78362 47.99900, -102.78192 47.9... | \n", "
4 | \n", "LAR0005 | \n", "Lake Traverse (Sisseton) LAR | \n", "1 | \n", "MULTIPOLYGON (((-97.28946 45.76084, -97.28955 ... | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
592 | \n", "{0886416F-643E-497E-89D3-E9CC0240158D} | \n", "Chilkat | \n", "None | \n", "POINT (-135.88440 59.40390) | \n", "
593 | \n", "{2029C35B-86D7-4751-A946-EA0772C81A80} | \n", "Chilkoot | \n", "None | \n", "POINT (-135.44500 59.23580) | \n", "
594 | \n", "{24DF6536-95CB-4964-94DF-16E440ABCA92} | \n", "Craig | \n", "None | \n", "POINT (-133.14830 55.47640) | \n", "
595 | \n", "{ACDE097A-9BDA-4FCA-9DB7-297DA6B73F88} | \n", "Douglas | \n", "None | \n", "POINT (-134.41970 58.30190) | \n", "
596 | \n", "{5E1D1895-FF41-4B11-9EDB-0C1254A360C4} | \n", "Agdaagux | \n", "None | \n", "POINT (-162.31030 55.06170) | \n", "
597 rows × 4 columns
\n", "\n", " | tribalId | \n", "landAreaName | \n", "Classification | \n", "geometry | \n", "
---|---|---|---|---|
0 | \n", "LAR0001 | \n", "Cheyenne River LAR | \n", "1 | \n", "MULTIPOLYGON (((-100.49935 45.47125, -100.4993... | \n", "
1 | \n", "LAR0002 | \n", "Crow Creek LAR | \n", "1 | \n", "POLYGON ((-99.42137 44.27733, -99.42138 44.273... | \n", "
2 | \n", "LAR0003 | \n", "Flandreau LAR | \n", "1 | \n", "MULTIPOLYGON (((-96.56655 44.08786, -96.57165 ... | \n", "
3 | \n", "LAR0004 | \n", "Fort Berthold LAR | \n", "1 | \n", "POLYGON ((-102.78362 47.99900, -102.78192 47.9... | \n", "
4 | \n", "LAR0005 | \n", "Lake Traverse (Sisseton) LAR | \n", "1 | \n", "MULTIPOLYGON (((-97.28946 45.76084, -97.28955 ... | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
365 | \n", "TSA0354 | \n", "Seminole TSA | \n", "None | \n", "POLYGON ((-96.49048 34.90423, -96.49146 34.903... | \n", "
366 | \n", "TSA0355 | \n", "Seneca Cayuga TSA | \n", "None | \n", "POLYGON ((-94.61803 36.62531, -94.62083 36.625... | \n", "
367 | \n", "TSA0356 | \n", "Tonkawa TSA | \n", "None | \n", "POLYGON ((-97.24698 36.68082, -97.24697 36.677... | \n", "
368 | \n", "TSA0357 | \n", "Wichita Caddo and Delaware TSA | \n", "None | \n", "POLYGON ((-97.99931 35.36425, -97.99948 35.360... | \n", "
369 | \n", "TSA0358 | \n", "Wyandotte TSA | \n", "None | \n", "POLYGON ((-94.61820 36.82030, -94.61821 36.816... | \n", "
370 rows × 4 columns
\n", "\n", " | STATEFP10 | \n", "COUNTYFP10 | \n", "TRACTCE10 | \n", "GEOID10 | \n", "NAME10 | \n", "NAMELSAD10 | \n", "MTFCC10 | \n", "FUNCSTAT10 | \n", "ALAND10 | \n", "AWATER10 | \n", "INTPTLAT10 | \n", "INTPTLON10 | \n", "geometry | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "20 | \n", "071 | \n", "958100 | \n", "20071958100 | \n", "9581 | \n", "Census Tract 9581 | \n", "G5020 | \n", "S | \n", "2016176814 | \n", "0 | \n", "+38.4804076 | \n", "-101.8059837 | \n", "POLYGON ((-101.79971 38.69806, -101.79097 38.6... | \n", "
1 | \n", "20 | \n", "175 | \n", "965600 | \n", "20175965600 | \n", "9656 | \n", "Census Tract 9656 | \n", "G5020 | \n", "S | \n", "1603575701 | \n", "2204351 | \n", "+37.1805849 | \n", "-100.8547406 | \n", "POLYGON ((-101.06766 37.20440, -101.06768 37.2... | \n", "
2 | \n", "20 | \n", "175 | \n", "965700 | \n", "20175965700 | \n", "9657 | \n", "Census Tract 9657 | \n", "G5020 | \n", "S | \n", "9466451 | \n", "358282 | \n", "+37.0625361 | \n", "-100.9131437 | \n", "POLYGON ((-100.94250 37.06497, -100.94251 37.0... | \n", "
3 | \n", "20 | \n", "043 | \n", "020300 | \n", "20043020300 | \n", "203 | \n", "Census Tract 203 | \n", "G5020 | \n", "S | \n", "211593206 | \n", "7045771 | \n", "+39.7881238 | \n", "-094.9734666 | \n", "POLYGON ((-94.95518 39.90129, -94.95475 39.901... | \n", "
4 | \n", "20 | \n", "043 | \n", "020200 | \n", "20043020200 | \n", "202 | \n", "Census Tract 202 | \n", "G5020 | \n", "S | \n", "352687026 | \n", "2968059 | \n", "+39.7540484 | \n", "-095.1060098 | \n", "POLYGON ((-95.02575 39.88295, -95.02585 39.883... | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
74129 | \n", "35 | \n", "049 | \n", "000600 | \n", "35049000600 | \n", "6 | \n", "Census Tract 6 | \n", "G5020 | \n", "S | \n", "1629471 | \n", "0 | \n", "+35.6758519 | \n", "-105.9446097 | \n", "POLYGON ((-105.95207 35.67367, -105.95215 35.6... | \n", "
74130 | \n", "35 | \n", "049 | \n", "000700 | \n", "35049000700 | \n", "7 | \n", "Census Tract 7 | \n", "G5020 | \n", "S | \n", "1285597 | \n", "0 | \n", "+35.6802004 | \n", "-105.9558818 | \n", "POLYGON ((-105.96221 35.67223, -105.96245 35.6... | \n", "
74131 | \n", "35 | \n", "049 | \n", "000800 | \n", "35049000800 | \n", "8 | \n", "Census Tract 8 | \n", "G5020 | \n", "S | \n", "1916797 | \n", "0 | \n", "+35.6805095 | \n", "-105.9703558 | \n", "POLYGON ((-105.98159 35.67739, -105.98143 35.6... | \n", "
74132 | \n", "35 | \n", "049 | \n", "000900 | \n", "35049000900 | \n", "9 | \n", "Census Tract 9 | \n", "G5020 | \n", "S | \n", "2545563 | \n", "0 | \n", "+35.6692966 | \n", "-105.9755351 | \n", "POLYGON ((-105.96362 35.67616, -105.96365 35.6... | \n", "
74133 | \n", "35 | \n", "049 | \n", "001001 | \n", "35049001001 | \n", "10.01 | \n", "Census Tract 10.01 | \n", "G5020 | \n", "S | \n", "2617281 | \n", "0 | \n", "+35.6647341 | \n", "-105.9468629 | \n", "POLYGON ((-105.94510 35.65705, -105.94563 35.6... | \n", "
74134 rows × 13 columns
\n", "\n", " | STATEFP10 | \n", "COUNTYFP10 | \n", "TRACTCE10 | \n", "GEOID10 | \n", "NAME10 | \n", "NAMELSAD10 | \n", "MTFCC10 | \n", "FUNCSTAT10 | \n", "ALAND10 | \n", "AWATER10 | \n", "INTPTLAT10 | \n", "INTPTLON10 | \n", "geometry | \n", "area_tract | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "20 | \n", "071 | \n", "958100 | \n", "20071958100 | \n", "9581 | \n", "Census Tract 9581 | \n", "G5020 | \n", "S | \n", "2016176814 | \n", "0 | \n", "+38.4804076 | \n", "-101.8059837 | \n", "POLYGON ((-101.79971 38.69806, -101.79097 38.6... | \n", "0.208156 | \n", "
1 | \n", "20 | \n", "175 | \n", "965600 | \n", "20175965600 | \n", "9656 | \n", "Census Tract 9656 | \n", "G5020 | \n", "S | \n", "1603575701 | \n", "2204351 | \n", "+37.1805849 | \n", "-100.8547406 | \n", "POLYGON ((-101.06766 37.20440, -101.06768 37.2... | \n", "0.162976 | \n", "
2 | \n", "20 | \n", "175 | \n", "965700 | \n", "20175965700 | \n", "9657 | \n", "Census Tract 9657 | \n", "G5020 | \n", "S | \n", "9466451 | \n", "358282 | \n", "+37.0625361 | \n", "-100.9131437 | \n", "POLYGON ((-100.94250 37.06497, -100.94251 37.0... | \n", "0.000995 | \n", "
3 | \n", "20 | \n", "043 | \n", "020300 | \n", "20043020300 | \n", "203 | \n", "Census Tract 203 | \n", "G5020 | \n", "S | \n", "211593206 | \n", "7045771 | \n", "+39.7881238 | \n", "-094.9734666 | \n", "POLYGON ((-94.95518 39.90129, -94.95475 39.901... | \n", "0.022990 | \n", "
4 | \n", "20 | \n", "043 | \n", "020200 | \n", "20043020200 | \n", "202 | \n", "Census Tract 202 | \n", "G5020 | \n", "S | \n", "352687026 | \n", "2968059 | \n", "+39.7540484 | \n", "-095.1060098 | \n", "POLYGON ((-95.02575 39.88295, -95.02585 39.883... | \n", "0.037373 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
74129 | \n", "35 | \n", "049 | \n", "000600 | \n", "35049000600 | \n", "6 | \n", "Census Tract 6 | \n", "G5020 | \n", "S | \n", "1629471 | \n", "0 | \n", "+35.6758519 | \n", "-105.9446097 | \n", "POLYGON ((-105.95207 35.67367, -105.95215 35.6... | \n", "0.000162 | \n", "
74130 | \n", "35 | \n", "049 | \n", "000700 | \n", "35049000700 | \n", "7 | \n", "Census Tract 7 | \n", "G5020 | \n", "S | \n", "1285597 | \n", "0 | \n", "+35.6802004 | \n", "-105.9558818 | \n", "POLYGON ((-105.96221 35.67223, -105.96245 35.6... | \n", "0.000128 | \n", "
74131 | \n", "35 | \n", "049 | \n", "000800 | \n", "35049000800 | \n", "8 | \n", "Census Tract 8 | \n", "G5020 | \n", "S | \n", "1916797 | \n", "0 | \n", "+35.6805095 | \n", "-105.9703558 | \n", "POLYGON ((-105.98159 35.67739, -105.98143 35.6... | \n", "0.000191 | \n", "
74132 | \n", "35 | \n", "049 | \n", "000900 | \n", "35049000900 | \n", "9 | \n", "Census Tract 9 | \n", "G5020 | \n", "S | \n", "2545563 | \n", "0 | \n", "+35.6692966 | \n", "-105.9755351 | \n", "POLYGON ((-105.96362 35.67616, -105.96365 35.6... | \n", "0.000253 | \n", "
74133 | \n", "35 | \n", "049 | \n", "001001 | \n", "35049001001 | \n", "10.01 | \n", "Census Tract 10.01 | \n", "G5020 | \n", "S | \n", "2617281 | \n", "0 | \n", "+35.6647341 | \n", "-105.9468629 | \n", "POLYGON ((-105.94510 35.65705, -105.94563 35.6... | \n", "0.000261 | \n", "
74134 rows × 14 columns
\n", "\n", " | STATEFP10 | \n", "COUNTYFP10 | \n", "TRACTCE10 | \n", "GEOID10 | \n", "NAME10 | \n", "NAMELSAD10 | \n", "MTFCC10 | \n", "FUNCSTAT10 | \n", "ALAND10 | \n", "AWATER10 | \n", "INTPTLAT10 | \n", "INTPTLON10 | \n", "area_tract | \n", "tribalId | \n", "landAreaName | \n", "Classification | \n", "geometry | \n", "area_joined | \n", "tribal_area_as_a_share_of_tract_area | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "20 | \n", "043 | \n", "020100 | \n", "20043020100 | \n", "201 | \n", "Census Tract 201 | \n", "G5020 | \n", "S | \n", "454634616.0 | \n", "2601186.0 | \n", "+39.8206800 | \n", "-095.2567279 | \n", "0.048098 | \n", "LAR0210 | \n", "Iowa LAR | \n", "1 | \n", "POLYGON ((-95.33994 39.97506, -95.33994 39.975... | \n", "4.998139e-04 | \n", "0.010391 | \n", "
1 | \n", "20 | \n", "013 | \n", "480600 | \n", "20013480600 | \n", "4806 | \n", "Census Tract 4806 | \n", "G5020 | \n", "S | \n", "882293538.0 | \n", "1376818.0 | \n", "+39.8596443 | \n", "-095.6255187 | \n", "0.093019 | \n", "LAR0210 | \n", "Iowa LAR | \n", "1 | \n", "POLYGON ((-95.45656 40.00025, -95.45528 40.000... | \n", "3.209294e-03 | \n", "0.034502 | \n", "
2 | \n", "31 | \n", "147 | \n", "964500 | \n", "31147964500 | \n", "9645 | \n", "Census Tract 9645 | \n", "G5020 | \n", "S | \n", "677848509.0 | \n", "6076731.0 | \n", "+40.1522236 | \n", "-095.5858870 | \n", "0.072289 | \n", "LAR0210 | \n", "Iowa LAR | \n", "1 | \n", "MULTIPOLYGON (((-95.38162 40.02744, -95.38119 ... | \n", "1.476624e-03 | \n", "0.020427 | \n", "
3 | \n", "29 | \n", "087 | \n", "960300 | \n", "29087960300 | \n", "9603 | \n", "Census Tract 9603 | \n", "G5020 | \n", "S | \n", "412869716.0 | \n", "6745159.0 | \n", "+39.9730230 | \n", "-095.1479701 | \n", "0.044239 | \n", "LAR0210 | \n", "Iowa LAR | \n", "1 | \n", "POLYGON ((-95.38119 40.02755, -95.38162 40.027... | \n", "1.965514e-07 | \n", "0.000004 | \n", "
4 | \n", "20 | \n", "085 | \n", "082600 | \n", "20085082600 | \n", "826 | \n", "Census Tract 826 | \n", "G5020 | \n", "S | \n", "690868809.0 | \n", "947758.0 | \n", "+39.4553966 | \n", "-095.6731404 | \n", "0.072404 | \n", "LAR0211 | \n", "Kickapoo (Kansas) LAR | \n", "1 | \n", "POLYGON ((-95.71031 39.65308, -95.69902 39.653... | \n", "5.285627e-06 | \n", "0.000073 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
76317 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "TSA0353 | \n", "Sac and Fox TSA | \n", "None | \n", "MULTIPOLYGON (((-96.62002 35.75143, -96.62001 ... | \n", "6.560647e-17 | \n", "NaN | \n", "
76318 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "TSA0354 | \n", "Seminole TSA | \n", "None | \n", "MULTIPOLYGON (((-96.77536 35.03300, -96.77536 ... | \n", "7.207055e-18 | \n", "NaN | \n", "
76319 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "TSA0355 | \n", "Seneca Cayuga TSA | \n", "None | \n", "POLYGON ((-94.61836 36.74340, -94.61836 36.743... | \n", "7.016721e-18 | \n", "NaN | \n", "
76320 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "TSA0356 | \n", "Tonkawa TSA | \n", "None | \n", "MULTIPOLYGON (((-97.24698 36.69942, -97.24692 ... | \n", "2.612218e-17 | \n", "NaN | \n", "
76321 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "TSA0358 | \n", "Wyandotte TSA | \n", "None | \n", "POLYGON ((-94.61828 36.78970, -94.61834 36.795... | \n", "1.555259e-18 | \n", "NaN | \n", "
76322 rows × 19 columns
\n", "