{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Sample workflow: 1990 block group parts to 2010 counties\n", "\n", "## Starting from a subset of 2010 Delaware blocks\n", "\n", "For further background information, see:\n", "* **Schroeder, J. P.** 2007. *Target-density weighting interpolation and uncertainty evaluation for temporal analysis of census data*. Geographical Analysis 39 (3):311–335.\n", "\n", "#### NHGIS [block crosswalks](https://www.nhgis.org/user-resources/geographic-crosswalks)" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "ExecuteTime": { "end_time": "2020-06-22T00:09:36.595166Z", "start_time": "2020-06-22T00:09:36.562841Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "2020-06-21T20:09:36-04:00\n", "\n", "CPython 3.7.6\n", "IPython 7.15.0\n", "\n", "compiler : Clang 9.0.1 \n", "system : Darwin\n", "release : 19.5.0\n", "machine : x86_64\n", "processor : i386\n", "CPU cores : 8\n", "interpreter: 64bit\n" ] } ], "source": [ "%load_ext watermark\n", "%watermark" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "ExecuteTime": { "end_time": "2020-06-22T00:09:37.352276Z", "start_time": "2020-06-22T00:09:37.073590Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "watermark 2.0.2\n", "nhgisxwalk 0.0.5\n", "numpy 1.18.5\n", "pandas 1.0.4\n", "\n" ] } ], "source": [ "import nhgisxwalk\n", "import inspect\n", "import numpy\n", "import pandas\n", "\n", "%load_ext autoreload\n", "%autoreload 2\n", "%watermark -w\n", "%watermark -iv" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### Source and target years for the crosswalk" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "ExecuteTime": { "end_time": "2020-06-22T00:09:38.160877Z", "start_time": "2020-06-22T00:09:38.130399Z" } }, "outputs": [], "source": [ "source_year, target_year = \"1990\", \"2010\"" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### 
Source-target building base" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "ExecuteTime": { "end_time": "2020-06-22T00:09:38.965841Z", "start_time": "2020-06-22T00:09:38.874865Z" } }, "outputs": [ { "data": { "text/html": [ "
| \n", " | GJOIN1990 | \n", "GJOIN2010 | \n", "WEIGHT | \n", "PAREA_VIA_BLK00 | \n", "
|---|---|---|---|---|
| 0 | \n", "NaN | \n", "G10000100432021078 | \n", "0.0 | \n", "0.0 | \n", "
| 1 | \n", "NaN | \n", "G10000100432023014 | \n", "0.0 | \n", "0.0 | \n", "
| 2 | \n", "NaN | \n", "G10000100432023015 | \n", "0.0 | \n", "0.0 | \n", "
| 3 | \n", "NaN | \n", "G10000109900000011 | \n", "0.0 | \n", "0.0 | \n", "
| 4 | \n", "NaN | \n", "G10000109900000012 | \n", "0.0 | \n", "0.0 | \n", "
| \n", " | bgp1990gj | \n", "cty2010gj | \n", "cty2010ge | \n", "wt_pop | \n", "wt_fam | \n", "wt_hh | \n", "wt_hu | \n", "
|---|---|---|---|---|---|---|---|
| 0 | \n", "G100001090444072500423009999999999921 | \n", "G1000010 | \n", "10001 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 1 | \n", "G100001090444444300422009999999999926 | \n", "G1000010 | \n", "10001 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 2 | \n", "G100001090444612650422009999999219011 | \n", "G1000010 | \n", "10001 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 3 | \n", "G100001090444612650422009999999219012 | \n", "G1000010 | \n", "10001 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 4 | \n", "G100001090444614800422009999999999924 | \n", "G1000010 | \n", "10001 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 772 | \n", "G100005093552999990515009999999999922 | \n", "G1000050 | \n", "10005 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 773 | \n", "G100005093552999990515009999999999923 | \n", "G1000050 | \n", "10005 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 774 | \n", "G100005093552999990515009999999999924 | \n", "G1000050 | \n", "10005 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 775 | \n", "G100005093552999990516009999999999921 | \n", "G1000050 | \n", "10005 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 776 | \n", "G340033010610106000204029999999916014 | \n", "G1000030 | \n", "10003 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "
777 rows × 7 columns
\n", "| \n", " | bgp1990gj | \n", "cty2010gj | \n", "cty2010ge | \n", "wt_pop | \n", "wt_fam | \n", "wt_hh | \n", "wt_hu | \n", "
|---|---|---|---|---|---|---|---|
| 0 | \n", "G100001090444072500423009999999999921 | \n", "G1000010 | \n", "10001 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 1 | \n", "G100001090444444300422009999999999926 | \n", "G1000010 | \n", "10001 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 2 | \n", "G100001090444612650422009999999219011 | \n", "G1000010 | \n", "10001 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 3 | \n", "G100001090444612650422009999999219012 | \n", "G1000010 | \n", "10001 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 4 | \n", "G100001090444614800422009999999999924 | \n", "G1000010 | \n", "10001 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 772 | \n", "G100005093552999990515009999999999922 | \n", "G1000050 | \n", "10005 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 773 | \n", "G100005093552999990515009999999999923 | \n", "G1000050 | \n", "10005 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 774 | \n", "G100005093552999990515009999999999924 | \n", "G1000050 | \n", "10005 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 775 | \n", "G100005093552999990516009999999999921 | \n", "G1000050 | \n", "10005 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
| 776 | \n", "G340033010610106000204029999999916014 | \n", "G1000030 | \n", "10003 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "
777 rows × 7 columns
\n", "