{ "metadata": { "name": "", "signature": "sha256:0dc6444fa70583def6226d897aa5534149ac315405391aff8cd17de1ead9f116" }, "nbformat": 3, "nbformat_minor": 0, "worksheets": [ { "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Applying Operations Over pandas DataFrames\n", "\n", "- **Author:** [Chris Albon](http://www.chrisalbon.com/), [@ChrisAlbon](https://twitter.com/chrisalbon)\n", "- **Date:** -\n", "- **Repo:** [Python 3 code snippets for data science](https://github.com/chrisalbon/code_py)\n", "- **Note:**" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### Import Modules" ] }, { "cell_type": "code", "collapsed": false, "input": [ "import pandas as pd\n", "import numpy as np" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 72 }, { "cell_type": "markdown", "metadata": {}, "source": [ "### Create a DataFrame" ] }, { "cell_type": "code", "collapsed": false, "input": [ "data = {'name': ['Jason', 'Molly', 'Tina', 'Jake', 'Amy'], \n", " 'year': [2012, 2012, 2013, 2014, 2014], \n", " 'reports': [4, 24, 31, 2, 3],\n", " 'coverage': [25, 94, 57, 62, 70]}\n", "df = pd.DataFrame(data, index = ['Cochice', 'Pima', 'Santa Cruz', 'Maricopa', 'Yuma'])\n", "df" ], "language": "python", "metadata": {}, "outputs": [ { "html": [ "
\n", " | coverage | \n", "name | \n", "reports | \n", "year | \n", "
---|---|---|---|---|
Cochice | \n", "25 | \n", "Jason | \n", "4 | \n", "2012 | \n", "
Pima | \n", "94 | \n", "Molly | \n", "24 | \n", "2012 | \n", "
Santa Cruz | \n", "57 | \n", "Tina | \n", "31 | \n", "2013 | \n", "
Maricopa | \n", "62 | \n", "Jake | \n", "2 | \n", "2014 | \n", "
Yuma | \n", "70 | \n", "Amy | \n", "3 | \n", "2014 | \n", "
5 rows \u00d7 4 columns
\n", "\n", " | coverage | \n", "reports | \n", "year | \n", "
---|---|---|---|
Cochice | \n", "5.000000 | \n", "2.000000 | \n", "44.855323 | \n", "
Pima | \n", "9.695360 | \n", "4.898979 | \n", "44.855323 | \n", "
Santa Cruz | \n", "7.549834 | \n", "5.567764 | \n", "44.866469 | \n", "
Maricopa | \n", "7.874008 | \n", "1.414214 | \n", "44.877611 | \n", "
Yuma | \n", "8.366600 | \n", "1.732051 | \n", "44.877611 | \n", "
5 rows \u00d7 3 columns
\n", "\n", " | coverage | \n", "reports | \n", "year | \n", "
---|---|---|---|
Cochice | \n", "2500 | \n", "400 | \n", "201200 | \n", "
Pima | \n", "9400 | \n", "2400 | \n", "201200 | \n", "
Santa Cruz | \n", "5700 | \n", "3100 | \n", "201300 | \n", "
Maricopa | \n", "6200 | \n", "200 | \n", "201400 | \n", "
Yuma | \n", "7000 | \n", "300 | \n", "201400 | \n", "
5 rows \u00d7 3 columns
\n", "