{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "## Imports" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "collapsed": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "0.20.3\n" ] } ], "source": [ "import os\n", "\n", "import pandas as pd\n", "from sklearn import preprocessing\n", "from sklearn.metrics import accuracy_score\n", "# train_test_split is imported from sklearn.model_selection: the old\n", "# sklearn.cross_validation module is deprecated since 0.18 and is\n", "# scheduled for removal in 0.20.\n", "from sklearn.model_selection import train_test_split\n", "from sklearn.tree import DecisionTreeClassifier\n", "\n", "# Record the pandas version this notebook was run with.\n", "# The call form of print works on both Python 2.7 and Python 3.\n", "print(pd.__version__)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Loading Data" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "collapsed": false }, "outputs": [ { "data": { "text/html": [ "
| \n", " | 0 | \n", "1 | \n", "2 | \n", "3 | \n", "4 | \n", "5 | \n", "6 | \n", "7 | \n", "8 | \n", "9 | \n", "10 | \n", "11 | \n", "12 | \n", "13 | \n", "14 | \n", "15 | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "b | \n", "30.83 | \n", "0.000 | \n", "u | \n", "g | \n", "w | \n", "v | \n", "1.25 | \n", "t | \n", "t | \n", "1 | \n", "f | \n", "g | \n", "00202 | \n", "0 | \n", "+ | \n", "
| 1 | \n", "a | \n", "58.67 | \n", "4.460 | \n", "u | \n", "g | \n", "q | \n", "h | \n", "3.04 | \n", "t | \n", "t | \n", "6 | \n", "f | \n", "g | \n", "00043 | \n", "560 | \n", "+ | \n", "
| 2 | \n", "a | \n", "24.50 | \n", "0.500 | \n", "u | \n", "g | \n", "q | \n", "h | \n", "1.50 | \n", "t | \n", "f | \n", "0 | \n", "f | \n", "g | \n", "00280 | \n", "824 | \n", "+ | \n", "
| 3 | \n", "b | \n", "27.83 | \n", "1.540 | \n", "u | \n", "g | \n", "w | \n", "v | \n", "3.75 | \n", "t | \n", "t | \n", "5 | \n", "t | \n", "g | \n", "00100 | \n", "3 | \n", "+ | \n", "
| 4 | \n", "b | \n", "20.17 | \n", "5.625 | \n", "u | \n", "g | \n", "w | \n", "v | \n", "1.71 | \n", "t | \n", "f | \n", "0 | \n", "f | \n", "s | \n", "00120 | \n", "0 | \n", "+ | \n", "