{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Examples and Exercises from Think Stats, 2nd Edition\n", "\n", "http://thinkstats2.com\n", "\n", "Copyright 2016 Allen B. Downey\n", "\n", "MIT License: https://opensource.org/licenses/MIT\n" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "from __future__ import print_function, division\n", "\n", "import nsfg  # module used to load the NSFG data" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Examples from Chapter 1\n", "\n", "Read NSFG data into a Pandas DataFrame." ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | caseid | \n", "pregordr | \n", "howpreg_n | \n", "howpreg_p | \n", "moscurrp | \n", "nowprgdk | \n", "pregend1 | \n", "pregend2 | \n", "nbrnaliv | \n", "multbrth | \n", "... | \n", "laborfor_i | \n", "religion_i | \n", "metro_i | \n", "basewgt | \n", "adj_mod_basewgt | \n", "finalwgt | \n", "secu_p | \n", "sest | \n", "cmintvw | \n", "totalwgt_lb | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1 | \n", "1 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "6.0 | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "3410.389399 | \n", "3869.349602 | \n", "6448.271112 | \n", "2 | \n", "9 | \n", "NaN | \n", "8.8125 | \n", "
1 | \n", "1 | \n", "2 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "6.0 | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "3410.389399 | \n", "3869.349602 | \n", "6448.271112 | \n", "2 | \n", "9 | \n", "NaN | \n", "7.8750 | \n", "
2 | \n", "2 | \n", "1 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "5.0 | \n", "NaN | \n", "3.0 | \n", "5.0 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "7226.301740 | \n", "8567.549110 | \n", "12999.542264 | \n", "2 | \n", "12 | \n", "NaN | \n", "9.1250 | \n", "
3 | \n", "2 | \n", "2 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "6.0 | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "7226.301740 | \n", "8567.549110 | \n", "12999.542264 | \n", "2 | \n", "12 | \n", "NaN | \n", "7.0000 | \n", "
4 | \n", "2 | \n", "3 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "6.0 | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "7226.301740 | \n", "8567.549110 | \n", "12999.542264 | \n", "2 | \n", "12 | \n", "NaN | \n", "6.1875 | \n", "
5 rows × 244 columns
\n", "\n", " | caseid | \n", "rscrinf | \n", "rdormres | \n", "rostscrn | \n", "rscreenhisp | \n", "rscreenrace | \n", "age_a | \n", "age_r | \n", "cmbirth | \n", "agescrn | \n", "... | \n", "pubassis_i | \n", "basewgt | \n", "adj_mod_basewgt | \n", "finalwgt | \n", "secu_r | \n", "sest | \n", "cmintvw | \n", "cmlstyr | \n", "screentime | \n", "intvlngth | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "2298 | \n", "1 | \n", "5 | \n", "5 | \n", "1 | \n", "5.0 | \n", "27 | \n", "27 | \n", "902 | \n", "27 | \n", "... | \n", "0 | \n", "3247.916977 | \n", "5123.759559 | \n", "5556.717241 | \n", "2 | \n", "18 | \n", "1234 | \n", "1222 | \n", "18:26:36 | \n", "110.492667 | \n", "
1 | \n", "5012 | \n", "1 | \n", "5 | \n", "1 | \n", "5 | \n", "5.0 | \n", "42 | \n", "42 | \n", "718 | \n", "42 | \n", "... | \n", "0 | \n", "2335.279149 | \n", "2846.799490 | \n", "4744.191350 | \n", "2 | \n", "18 | \n", "1233 | \n", "1221 | \n", "16:30:59 | \n", "64.294000 | \n", "
2 | \n", "11586 | \n", "1 | \n", "5 | \n", "1 | \n", "5 | \n", "5.0 | \n", "43 | \n", "43 | \n", "708 | \n", "43 | \n", "... | \n", "0 | \n", "2335.279149 | \n", "2846.799490 | \n", "4744.191350 | \n", "2 | \n", "18 | \n", "1234 | \n", "1222 | \n", "18:19:09 | \n", "75.149167 | \n", "
3 | \n", "6794 | \n", "5 | \n", "5 | \n", "4 | \n", "1 | \n", "5.0 | \n", "15 | \n", "15 | \n", "1042 | \n", "15 | \n", "... | \n", "0 | \n", "3783.152221 | \n", "5071.464231 | \n", "5923.977368 | \n", "2 | \n", "18 | \n", "1234 | \n", "1222 | \n", "15:54:43 | \n", "28.642833 | \n", "
4 | \n", "616 | \n", "1 | \n", "5 | \n", "4 | \n", "1 | \n", "5.0 | \n", "20 | \n", "20 | \n", "991 | \n", "20 | \n", "... | \n", "0 | \n", "5341.329968 | \n", "6437.335772 | \n", "7229.128072 | \n", "2 | \n", "18 | \n", "1233 | \n", "1221 | \n", "14:19:44 | \n", "69.502667 | \n", "
5 rows × 3087 columns
\n", "\n", " | caseid | \n", "rscrinf | \n", "rdormres | \n", "rostscrn | \n", "rscreenhisp | \n", "rscreenrace | \n", "age_a | \n", "age_r | \n", "cmbirth | \n", "agescrn | \n", "... | \n", "pubassis_i | \n", "basewgt | \n", "adj_mod_basewgt | \n", "finalwgt | \n", "secu_r | \n", "sest | \n", "cmintvw | \n", "cmlstyr | \n", "screentime | \n", "intvlngth | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "2298 | \n", "1 | \n", "5 | \n", "5 | \n", "1 | \n", "5.0 | \n", "27 | \n", "27 | \n", "902 | \n", "27 | \n", "... | \n", "0 | \n", "3247.916977 | \n", "5123.759559 | \n", "5556.717241 | \n", "2 | \n", "18 | \n", "1234 | \n", "1222 | \n", "18:26:36 | \n", "110.492667 | \n", "
1 rows × 3087 columns
\n", "\n", " | caseid | \n", "pregordr | \n", "howpreg_n | \n", "howpreg_p | \n", "moscurrp | \n", "nowprgdk | \n", "pregend1 | \n", "pregend2 | \n", "nbrnaliv | \n", "multbrth | \n", "... | \n", "religion_i | \n", "metro_i | \n", "basewgt | \n", "adj_mod_basewgt | \n", "finalwgt | \n", "secu_p | \n", "sest | \n", "cmintvw | \n", "totalwgt_lb | \n", "totalwgt_kg | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
2610 | \n", "2298 | \n", "1 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "6.0 | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "... | \n", "0 | \n", "0 | \n", "3247.916977 | \n", "5123.759559 | \n", "5556.717241 | \n", "2 | \n", "18 | \n", "NaN | \n", "6.8750 | \n", "15.1250 | \n", "
2611 | \n", "2298 | \n", "2 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "6.0 | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "... | \n", "0 | \n", "0 | \n", "3247.916977 | \n", "5123.759559 | \n", "5556.717241 | \n", "2 | \n", "18 | \n", "NaN | \n", "5.5000 | \n", "12.1000 | \n", "
2612 | \n", "2298 | \n", "3 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "6.0 | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "... | \n", "0 | \n", "0 | \n", "3247.916977 | \n", "5123.759559 | \n", "5556.717241 | \n", "2 | \n", "18 | \n", "NaN | \n", "4.1875 | \n", "9.2125 | \n", "
2613 | \n", "2298 | \n", "4 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "6.0 | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "... | \n", "0 | \n", "0 | \n", "3247.916977 | \n", "5123.759559 | \n", "5556.717241 | \n", "2 | \n", "18 | \n", "NaN | \n", "6.8750 | \n", "15.1250 | \n", "
4 rows × 245 columns
\n", "