{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": { "collapsed": true }, "outputs": [], "source": [ "from glob import glob\n", "\n", "import pandas as pd\n", "\n", "from preamble import *\n", "\n", "%matplotlib notebook" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Gaussian Processes\n", "\n", "Check out http://scikit-learn.org/dev/modules/gaussian_process.html" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### Download data from https://s3.amazonaws.com/tripdata/201307-201402-citibike-tripdata.zip" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "collapsed": false }, "outputs": [], "source": [ "# glob returns paths in arbitrary order; sort them so the row order of the\n", "# concatenated frame is the same on every run.\n", "csv_paths = sorted(glob(\"data/citibike/*.csv\"))\n", "dfs = [pd.read_csv(csv_path) for csv_path in csv_paths]" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "collapsed": false }, "outputs": [], "source": [ "data = pd.concat(dfs)" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "collapsed": false }, "outputs": [ { "data": { "text/plain": [ "Index(['tripduration', 'starttime', 'stoptime', 'start station id',\n", " 'start station name', 'start station latitude',\n", " 'start station longitude', 'end station id', 'end station name',\n", " 'end station latitude', 'end station longitude', 'bikeid', 'usertype',\n", " 'birth year', 'gender'],\n", " dtype='object')" ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "data.columns" ] }, { "cell_type": "code", "execution_count": 5, "metadata": { "collapsed": false }, "outputs": [ { "data": { "text/html": [ "
\n", " | tripduration | \n", "starttime | \n", "stoptime | \n", "start station id | \n", "start station name | \n", "start station latitude | \n", "start station longitude | \n", "end station id | \n", "end station name | \n", "end station latitude | \n", "end station longitude | \n", "bikeid | \n", "usertype | \n", "birth year | \n", "gender | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "326 | \n", "2013-10-01 00:01:08 | \n", "2013-10-01 00:06:34 | \n", "239 | \n", "Willoughby St & Fleet St | \n", "40.691966 | \n", "-73.981302 | \n", "366 | \n", "Clinton Ave & Myrtle Ave | \n", "40.693261 | \n", "-73.968896 | \n", "16052 | \n", "Subscriber | \n", "1982 | \n", "1 | \n", "
1 | \n", "729 | \n", "2013-10-01 00:01:21 | \n", "2013-10-01 00:13:30 | \n", "322 | \n", "Clinton St & Tillary St | \n", "40.696192 | \n", "-73.991218 | \n", "398 | \n", "Atlantic Ave & Furman St | \n", "40.691652 | \n", "-73.999979 | \n", "19412 | \n", "Customer | \n", "\\N | \n", "0 | \n", "
2 | \n", "520 | \n", "2013-10-01 00:01:24 | \n", "2013-10-01 00:10:04 | \n", "174 | \n", "E 25 St & 1 Ave | \n", "40.738177 | \n", "-73.977387 | \n", "403 | \n", "E 2 St & 2 Ave | \n", "40.725029 | \n", "-73.990697 | \n", "19645 | \n", "Subscriber | \n", "1984 | \n", "1 | \n", "
3 | \n", "281 | \n", "2013-10-01 00:01:25 | \n", "2013-10-01 00:06:06 | \n", "430 | \n", "York St & Jay St | \n", "40.701485 | \n", "-73.986569 | \n", "323 | \n", "Lawrence St & Willoughby St | \n", "40.692362 | \n", "-73.986317 | \n", "16992 | \n", "Subscriber | \n", "1985 | \n", "1 | \n", "
4 | \n", "196 | \n", "2013-10-01 00:01:27 | \n", "2013-10-01 00:04:43 | \n", "403 | \n", "E 2 St & 2 Ave | \n", "40.725029 | \n", "-73.990697 | \n", "401 | \n", "Allen St & Rivington St | \n", "40.720196 | \n", "-73.989978 | \n", "15690 | \n", "Subscriber | \n", "1986 | \n", "1 | \n", "