{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Distributions\n", "> A summary of the lecture \"Exploratory Data Analysis in Python\", via DataCamp\n", "\n", "- toc: true \n", "- badges: true\n", "- comments: true\n", "- author: Chanseok Kang\n", "- categories: [Python, Datacamp]\n", "- image: images/income-cdf.png" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Probability mass functions" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "from empiricaldist import Pmf, Cdf\n", "from scipy.stats import norm" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | year | \n", "age | \n", "cohort | \n", "sex | \n", "race | \n", "educ | \n", "realinc | \n", "gunlaw | \n", "grass | \n", "wtssall | \n", "
---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1972 | \n", "26.0 | \n", "1946.0 | \n", "1 | \n", "1 | \n", "18.0 | \n", "13537.0 | \n", "2.0 | \n", "NaN | \n", "0.8893 | \n", "
1 | \n", "1972 | \n", "38.0 | \n", "1934.0 | \n", "2 | \n", "1 | \n", "12.0 | \n", "18951.0 | \n", "1.0 | \n", "NaN | \n", "0.4446 | \n", "
2 | \n", "1972 | \n", "57.0 | \n", "1915.0 | \n", "1 | \n", "1 | \n", "12.0 | \n", "30458.0 | \n", "1.0 | \n", "NaN | \n", "1.3339 | \n", "
3 | \n", "1972 | \n", "61.0 | \n", "1911.0 | \n", "2 | \n", "1 | \n", "14.0 | \n", "37226.0 | \n", "1.0 | \n", "NaN | \n", "0.8893 | \n", "
4 | \n", "1972 | \n", "59.0 | \n", "1913.0 | \n", "1 | \n", "1 | \n", "12.0 | \n", "30458.0 | \n", "2.0 | \n", "NaN | \n", "0.8893 | \n", "