{ "metadata": { "name": "" }, "nbformat": 3, "nbformat_minor": 0, "worksheets": [ { "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "## Chapter 4: Classification ##" ] }, { "cell_type": "code", "collapsed": false, "input": [ "from __future__ import division\n", "import pandas as pd\n", "import numpy as np\n", "import matplotlib.pyplot as plt\n", "from sklearn.linear_model import LogisticRegression\n", "# `sklearn.lda` was deprecated in scikit-learn 0.17 and later removed; prefer the\n", "# current location and fall back to the legacy module on old installs. The `LDA`\n", "# alias is kept so the rest of the notebook can keep using that name.\n", "try:\n", "    from sklearn.discriminant_analysis import LinearDiscriminantAnalysis as LDA\n", "except ImportError:\n", "    from sklearn.lda import LDA\n", "from sklearn.neighbors import KNeighborsClassifier\n", "from sklearn.metrics import confusion_matrix\n", "from sklearn.metrics import accuracy_score\n", "%matplotlib inline" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 1 }, { "cell_type": "code", "collapsed": false, "input": [ "smarket_df = pd.read_csv(\"../data/Smarket.csv\")\n", "smarket_df.head()" ], "language": "python", "metadata": {}, "outputs": [ { "html": [ "
| \n", " | Year | \n", "Lag1 | \n", "Lag2 | \n", "Lag3 | \n", "Lag4 | \n", "Lag5 | \n", "Volume | \n", "Today | \n", "Direction | \n", "
|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "2001 | \n", "0.381 | \n", "-0.192 | \n", "-2.624 | \n", "-1.055 | \n", "5.010 | \n", "1.1913 | \n", "0.959 | \n", "Up | \n", "
| 1 | \n", "2001 | \n", "0.959 | \n", "0.381 | \n", "-0.192 | \n", "-2.624 | \n", "-1.055 | \n", "1.2965 | \n", "1.032 | \n", "Up | \n", "
| 2 | \n", "2001 | \n", "1.032 | \n", "0.959 | \n", "0.381 | \n", "-0.192 | \n", "-2.624 | \n", "1.4112 | \n", "-0.623 | \n", "Down | \n", "
| 3 | \n", "2001 | \n", "-0.623 | \n", "1.032 | \n", "0.959 | \n", "0.381 | \n", "-0.192 | \n", "1.2760 | \n", "0.614 | \n", "Up | \n", "
| 4 | \n", "2001 | \n", "0.614 | \n", "-0.623 | \n", "1.032 | \n", "0.959 | \n", "0.381 | \n", "1.2057 | \n", "0.213 | \n", "Up | \n", "
5 rows \u00d7 9 columns
\n", "