{ "metadata": { "name": "", "signature": "sha256:56e3d62355fc065626699ebb696ceabe03f7b3853b3e204c8e5d63fe0567cb29" }, "nbformat": 3, "nbformat_minor": 0, "worksheets": [ { "cells": [ { "cell_type": "code", "collapsed": false, "input": [
 "# NOTE(review): the star import is left in place because cells outside this\n",
 "# view may use bare NumPy names; switch to `import numpy as np` once confirmed.\n",
 "from numpy import *\n",
 "import operator\n",
 "\n",
 "import pandas as pd\n",
 "import seaborn as sns\n",
 "from mpl_toolkits.mplot3d import Axes3D\n",
 "\n",
 "# Global plot styling: poster context, dark style, 0.5-wide marker edges.\n",
 "sns.set(context='poster', style='dark')\n",
 "sns.set_context(rc={'lines.markeredgewidth': 0.5})\n",
 "\n",
 "# The data file is tab-separated with no header row, so name the columns here.\n",
 "dating_df = pd.read_csv('datingTestSet2.txt', sep='\\t', header=None)\n",
 "dating_df.columns = ['miles', 'games', 'ice_cream', 'opinion']\n",
 "\n",
 "# Every column except the last is min-max scaled; the last is copied as-is.\n",
 "labels = dating_df.columns[:-1]\n",
 "features = dating_df[labels]\n",
 "col_min = features.min()\n",
 "col_range = features.max() - col_min\n",
 "# A constant column has zero range; divide by 1 instead so it maps to 0.0\n",
 "# rather than NaN (0/0).\n",
 "col_range = col_range.where(col_range != 0, 1)\n",
 "\n",
 "# (x - min) / (max - min), broadcast column-wise over the whole frame.\n",
 "norm_df = (features - col_min) / col_range\n",
 "norm_df['opinion'] = dating_df['opinion']\n",
 "norm_df.head()"
 ], "language": "python", "metadata": {}, "outputs": [ { "html": [ "
\n", " | miles | \n", "games | \n", "ice_cream | \n", "opinion | \n", "
---|---|---|---|---|
0 | \n", "0.448325 | \n", "0.398051 | \n", "0.562334 | \n", "3 | \n", "
1 | \n", "0.158733 | \n", "0.341955 | \n", "0.987244 | \n", "2 | \n", "
2 | \n", "0.285429 | \n", "0.068925 | \n", "0.474496 | \n", "1 | \n", "
3 | \n", "0.823201 | \n", "0.628480 | \n", "0.252489 | \n", "1 | \n", "
4 | \n", "0.420102 | \n", "0.079820 | \n", "0.078578 | \n", "1 | \n", "