{ "metadata": { "name": "", "signature": "sha256:573cd9578967856f7dcd1df55351af8d3c475a4e3794ba81be885388f876b1a7" }, "nbformat": 3, "nbformat_minor": 0, "worksheets": [ { "cells": [ { "cell_type": "code", "collapsed": false, "input": [ "from IPython.core.display import HTML\n", "\n", "with open('creative_commons.txt', 'r') as f:\n", " html = f.read()\n", " \n", "name = '2014-06-16-seaborn'\n", "\n", "html = '''\n", "\n", "
This post was written as an IPython notebook.\n", " It is available for download\n", " or as a static html.
\n", "\n", "%s''' % (name, name, html)\n", "\n", "%matplotlib inline\n", "from matplotlib import style\n", "style.use('ggplot')" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 1 }, { "cell_type": "markdown", "metadata": {}, "source": [ "This week I was helping a friend explore her dataset with some simple\n", "statistics and plots. So I decided to try\n", "[seaborn](http://web.stanford.edu/~mwaskom/software/seaborn/index.html) out.\n", "\n", "It is a really nice library that, together with pandas, becomes a powerful tool\n", "for taking the first steps while exploring your data.\n", "\n", "Here is a simple example of what we did." ] }, { "cell_type": "code", "collapsed": false, "input": [ "import seaborn\n", "import numpy as np\n", "import matplotlib.pyplot as plt\n", "\n", "from io import BytesIO\n", "from pandas import read_csv" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 2 }, { "cell_type": "code", "collapsed": false, "input": [ "kw = dict(na_values='NaN', sep=',', encoding='utf-8',\n", " skipinitialspace=True, index_col=False)\n", "\n", "df = read_csv(\"./data/fish.csv\", **kw)" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 3 }, { "cell_type": "code", "collapsed": false, "input": [ "df.head()" ], "language": "python", "metadata": {}, "outputs": [ { "html": [ "\n", " | Days | \n", "ID | \n", "Recovery | \n", "Extract weight | \n", "Lipid % | \n", "Weight (g) | \n", "Size (cm) | \n", "Liver weight (g) | \n", "LSI | \n", "CF | \n", "BDE 47 (ng/g) | \n", "BDE 99 (ng/g) | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0 | \n", "A | \n", "73.21 | \n", "0.10 | \n", "3.600000 | \n", "20.09 | \n", "12.8 | \n", "0.14 | \n", "0.696864 | \n", "0.957966 | \n", "0 | \n", "0 | \n", "
1 | \n", "0 | \n", "B | \n", "98.24 | \n", "0.22 | \n", "2.272727 | \n", "36.52 | \n", "15.5 | \n", "0.33 | \n", "0.903614 | \n", "0.980699 | \n", "0 | \n", "0 | \n", "
2 | \n", "0 | \n", "C | \n", "89.71 | \n", "0.18 | \n", "3.500000 | \n", "28.74 | \n", "14.7 | \n", "0.25 | \n", "0.869868 | \n", "0.904763 | \n", "0 | \n", "0 | \n", "
3 | \n", "1 | \n", "A | \n", "78.40 | \n", "0.13 | \n", "1.330769 | \n", "23.70 | \n", "14.0 | \n", "0.15 | \n", "0.632911 | \n", "0.863703 | \n", "0 | \n", "0 | \n", "
4 | \n", "1 | \n", "B | \n", "66.24 | \n", "0.13 | \n", "2.838462 | \n", "32.80 | \n", "15.0 | \n", "0.20 | \n", "0.609756 | \n", "0.971852 | \n", "0 | \n", "0 | \n", "
\n", " | \n", " | BDE 47 (ng/g) | \n", "BDE 99 (ng/g) | \n", "CF | \n", "Extract weight | \n", "LSI | \n", "Lipid % | \n", "Liver weight (g) | \n", "Recovery | \n", "Size (cm) | \n", "Weight (g) | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
Days | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
0 | \n", "count | \n", "3 | \n", "3 | \n", "3.000000 | \n", "3.000000 | \n", "3.000000 | \n", "3.000000 | \n", "3.000000 | \n", "3.000000 | \n", "3.000000 | \n", "3.000000 | \n", "
mean | \n", "0 | \n", "0 | \n", "0.947809 | \n", "0.166667 | \n", "0.823449 | \n", "3.124242 | \n", "0.240000 | \n", "87.053333 | \n", "14.333333 | \n", "28.450000 | \n", "|
std | \n", "0 | \n", "0 | \n", "0.038974 | \n", "0.061101 | \n", "0.110916 | \n", "0.739127 | \n", "0.095394 | \n", "12.724725 | \n", "1.386843 | \n", "8.218838 | \n", "|
min | \n", "0 | \n", "0 | \n", "0.904763 | \n", "0.100000 | \n", "0.696864 | \n", "2.272727 | \n", "0.140000 | \n", "73.210000 | \n", "12.800000 | \n", "20.090000 | \n", "|
25% | \n", "0 | \n", "0 | \n", "0.931364 | \n", "0.140000 | \n", "0.783366 | \n", "2.886364 | \n", "0.195000 | \n", "81.460000 | \n", "13.750000 | \n", "24.415000 | \n", "
This post was written as an IPython notebook.\n", " It is available for download\n", " or as a static html.
\n", "\n", "