{ "metadata": { "name": "", "signature": "sha256:1c6173a6f0cec1737eb8ab133f3b3570ba765d9d236a56e865e46f9c36df1cea" }, "nbformat": 3, "nbformat_minor": 0, "worksheets": [ { "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Binning Data In Pandas\n", "\n", "- **Author:** [Chris Albon](http://www.chrisalbon.com/), [@ChrisAlbon](https://twitter.com/chrisalbon)\n", "- **Date:** -\n", "- **Repo:** [Python 3 code snippets for data science](https://github.com/chrisalbon/code_py)\n", "- **Note:**" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### Import modules" ] }, { "cell_type": "code", "collapsed": false, "input": [ "import pandas as pd" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 1 }, { "cell_type": "markdown", "metadata": {}, "source": [ "### Create dataframe" ] }, { "cell_type": "code", "collapsed": false, "input": [ "raw_data = {'regiment': ['Nighthawks', 'Nighthawks', 'Nighthawks', 'Nighthawks', 'Dragoons', 'Dragoons', 'Dragoons', 'Dragoons', 'Scouts', 'Scouts', 'Scouts', 'Scouts'], \n", " 'company': ['1st', '1st', '2nd', '2nd', '1st', '1st', '2nd', '2nd','1st', '1st', '2nd', '2nd'], \n", " 'name': ['Miller', 'Jacobson', 'Ali', 'Milner', 'Cooze', 'Jacon', 'Ryaner', 'Sone', 'Sloan', 'Piger', 'Riani', 'Ali'], \n", " 'preTestScore': [4, 24, 31, 2, 3, 4, 24, 31, 2, 3, 2, 3],\n", " 'postTestScore': [25, 94, 57, 62, 70, 25, 94, 57, 62, 70, 62, 70]}\n", "df = pd.DataFrame(raw_data, columns = ['regiment', 'company', 'name', 'preTestScore', 'postTestScore'])\n", "df" ], "language": "python", "metadata": {}, "outputs": [ { "html": [ "
\n", " | regiment | \n", "company | \n", "name | \n", "preTestScore | \n", "postTestScore | \n", "
---|---|---|---|---|---|
0 | \n", "Nighthawks | \n", "1st | \n", "Miller | \n", "4 | \n", "25 | \n", "
1 | \n", "Nighthawks | \n", "1st | \n", "Jacobson | \n", "24 | \n", "94 | \n", "
2 | \n", "Nighthawks | \n", "2nd | \n", "Ali | \n", "31 | \n", "57 | \n", "
3 | \n", "Nighthawks | \n", "2nd | \n", "Milner | \n", "2 | \n", "62 | \n", "
4 | \n", "Dragoons | \n", "1st | \n", "Cooze | \n", "3 | \n", "70 | \n", "
5 | \n", "Dragoons | \n", "1st | \n", "Jacon | \n", "4 | \n", "25 | \n", "
6 | \n", "Dragoons | \n", "2nd | \n", "Ryaner | \n", "24 | \n", "94 | \n", "
7 | \n", "Dragoons | \n", "2nd | \n", "Sone | \n", "31 | \n", "57 | \n", "
8 | \n", "Scouts | \n", "1st | \n", "Sloan | \n", "2 | \n", "62 | \n", "
9 | \n", "Scouts | \n", "1st | \n", "Piger | \n", "3 | \n", "70 | \n", "
10 | \n", "Scouts | \n", "2nd | \n", "Riani | \n", "2 | \n", "62 | \n", "
11 | \n", "Scouts | \n", "2nd | \n", "Ali | \n", "3 | \n", "70 | \n", "
12 rows \u00d7 5 columns
\n", "\n", " | regiment | \n", "company | \n", "name | \n", "preTestScore | \n", "postTestScore | \n", "scoresBinned | \n", "categories | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "Nighthawks | \n", "1st | \n", "Miller | \n", "4 | \n", "25 | \n", "(0, 25] | \n", "Low | \n", "
1 | \n", "Nighthawks | \n", "1st | \n", "Jacobson | \n", "24 | \n", "94 | \n", "(75, 100] | \n", "Great | \n", "
2 | \n", "Nighthawks | \n", "2nd | \n", "Ali | \n", "31 | \n", "57 | \n", "(50, 75] | \n", "Good | \n", "
3 | \n", "Nighthawks | \n", "2nd | \n", "Milner | \n", "2 | \n", "62 | \n", "(50, 75] | \n", "Good | \n", "
4 | \n", "Dragoons | \n", "1st | \n", "Cooze | \n", "3 | \n", "70 | \n", "(50, 75] | \n", "Good | \n", "
5 | \n", "Dragoons | \n", "1st | \n", "Jacon | \n", "4 | \n", "25 | \n", "(0, 25] | \n", "Low | \n", "
6 | \n", "Dragoons | \n", "2nd | \n", "Ryaner | \n", "24 | \n", "94 | \n", "(75, 100] | \n", "Great | \n", "
7 | \n", "Dragoons | \n", "2nd | \n", "Sone | \n", "31 | \n", "57 | \n", "(50, 75] | \n", "Good | \n", "
8 | \n", "Scouts | \n", "1st | \n", "Sloan | \n", "2 | \n", "62 | \n", "(50, 75] | \n", "Good | \n", "
9 | \n", "Scouts | \n", "1st | \n", "Piger | \n", "3 | \n", "70 | \n", "(50, 75] | \n", "Good | \n", "
10 | \n", "Scouts | \n", "2nd | \n", "Riani | \n", "2 | \n", "62 | \n", "(50, 75] | \n", "Good | \n", "
11 | \n", "Scouts | \n", "2nd | \n", "Ali | \n", "3 | \n", "70 | \n", "(50, 75] | \n", "Good | \n", "
12 rows \u00d7 7 columns
\n", "