{ "cells": [ { "cell_type": "markdown", "metadata": { "slideshow": { "slide_type": "slide" } }, "source": [ "# Timeseries" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "collapsed": false, "slideshow": { "slide_type": "-" } }, "outputs": [], "source": [ "import numpy as np\n", "import pandas as pd\n", "%matplotlib inline\n", "pd.options.display.max_rows = 12\n", "pd.options.display.max_columns = 8\n", "pd.options.display.width = 80" ] }, { "cell_type": "markdown", "metadata": { "slideshow": { "slide_type": "subslide" } }, "source": [ "A nice blog post analyzing Seattle bikeshare data:\n", "\n", "https://jakevdp.github.io/blog/2015/10/17/analyzing-pronto-cycleshare-data-with-python-and-pandas/" ] }, { "cell_type": "markdown", "metadata": { "slideshow": { "slide_type": "fragment" } }, "source": [ "Get the NYC Citi Bike trip data for September 2015 and extract it into `data/`:\n", "\n", "https://www.citibikenyc.com/system-data\n", "\n", "```\n", "unzip data/201509-citibike-tripdata.zip -d data\n", "```" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "collapsed": false, "slideshow": { "slide_type": "subslide" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\"tripduration\",\"starttime\",\"stoptime\",\"start station id\",\"start station name\",\"start station latitude\",\"start station longitude\",\"end station id\",\"end station name\",\"end station latitude\",\"end station longitude\",\"bikeid\",\"usertype\",\"birth year\",\"gender\"\r", "\r\n", "\"288\",\"9/1/2015 00:00:00\",\"9/1/2015 00:04:48\",\"263\",\"Elizabeth St & Hester St\",\"40.71729\",\"-73.996375\",\"307\",\"Canal St & Rutgers St\",\"40.71427487\",\"-73.98990025\",\"15479\",\"Subscriber\",\"1989\",\"1\"\r", "\r\n", "\"165\",\"9/1/2015 00:00:00\",\"9/1/2015 00:02:45\",\"495\",\"W 47 St & 10 Ave\",\"40.76269882\",\"-73.99301222\",\"449\",\"W 52 St & 9 Ave\",\"40.76461837\",\"-73.98789473\",\"23899\",\"Subscriber\",\"1987\",\"1\"\r", "\r\n", "\"367\",\"9/1/2015 00:00:01\",\"9/1/2015 00:06:08\",\"3119\",\"Vernon Blvd & 50 
Ave\",\"40.74232744\",\"-73.95411749\",\"3118\",\"McGuinness Blvd & Eagle St\",\"40.73555\",\"-73.95284\",\"23921\",\"Customer\",\"\",\"0\"\r", "\r\n", "\"926\",\"9/1/2015 00:00:07\",\"9/1/2015 00:15:34\",\"536\",\"1 Ave & E 30 St\",\"40.74144387\",\"-73.97536082\",\"340\",\"Madison St & Clinton St\",\"40.71269042\",\"-73.98776323\",\"23256\",\"Subscriber\",\"1992\",\"1\"\r", "\r", "\r\n" ] } ], "source": [ "!head -5 data/201509-citibike-tripdata.csv" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "collapsed": false, "slideshow": { "slide_type": "subslide" } }, "outputs": [ { "data": { "text/html": [ "
\n", " | tripduration | \n", "starttime | \n", "stoptime | \n", "start station id | \n", "... | \n", "bikeid | \n", "usertype | \n", "birth year | \n", "gender | \n", "
---|---|---|---|---|---|---|---|---|---|
0 | \n", "288 | \n", "2015-09-01 00:00:00 | \n", "2015-09-01 00:04:48 | \n", "263 | \n", "... | \n", "15479 | \n", "Subscriber | \n", "1989 | \n", "1 | \n", "
1 | \n", "165 | \n", "2015-09-01 00:00:00 | \n", "2015-09-01 00:02:45 | \n", "495 | \n", "... | \n", "23899 | \n", "Subscriber | \n", "1987 | \n", "1 | \n", "
2 | \n", "367 | \n", "2015-09-01 00:00:01 | \n", "2015-09-01 00:06:08 | \n", "3119 | \n", "... | \n", "23921 | \n", "Customer | \n", "NaN | \n", "0 | \n", "
3 | \n", "926 | \n", "2015-09-01 00:00:07 | \n", "2015-09-01 00:15:34 | \n", "536 | \n", "... | \n", "23256 | \n", "Subscriber | \n", "1992 | \n", "1 | \n", "
4 | \n", "658 | \n", "2015-09-01 00:00:09 | \n", "2015-09-01 00:11:07 | \n", "347 | \n", "... | \n", "17289 | \n", "Subscriber | \n", "1976 | \n", "1 | \n", "
5 | \n", "392 | \n", "2015-09-01 00:00:13 | \n", "2015-09-01 00:06:46 | \n", "2004 | \n", "... | \n", "15438 | \n", "Subscriber | \n", "1955 | \n", "1 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
1289693 | \n", "203 | \n", "2015-09-30 23:58:56 | \n", "2015-10-01 00:02:19 | \n", "439 | \n", "... | \n", "21305 | \n", "Subscriber | \n", "1982 | \n", "1 | \n", "
1289694 | \n", "1200 | \n", "2015-09-30 23:59:07 | \n", "2015-10-01 00:19:07 | \n", "3082 | \n", "... | \n", "23295 | \n", "Customer | \n", "NaN | \n", "0 | \n", "
1289695 | \n", "1195 | \n", "2015-09-30 23:59:10 | \n", "2015-10-01 00:19:05 | \n", "3082 | \n", "... | \n", "22286 | \n", "Customer | \n", "NaN | \n", "0 | \n", "
1289696 | \n", "652 | \n", "2015-09-30 23:59:44 | \n", "2015-10-01 00:10:37 | \n", "432 | \n", "... | \n", "23486 | \n", "Subscriber | \n", "1979 | \n", "1 | \n", "
1289697 | \n", "1733 | \n", "2015-09-30 23:59:48 | \n", "2015-10-01 00:28:42 | \n", "267 | \n", "... | \n", "23705 | \n", "Subscriber | \n", "1985 | \n", "2 | \n", "
1289698 | \n", "1106 | \n", "2015-09-30 23:59:57 | \n", "2015-10-01 00:18:24 | \n", "228 | \n", "... | \n", "22529 | \n", "Subscriber | \n", "1977 | \n", "1 | \n", "
1289699 rows × 15 columns
\n", "usertype | \n", "Customer | \n", "Subscriber | \n", "
---|---|---|
starttime | \n", "\n", " | \n", " |
2015-09-01 | \n", "4846 | \n", "38445 | \n", "
2015-09-02 | \n", "4683 | \n", "38542 | \n", "
2015-09-03 | \n", "5049 | \n", "37830 | \n", "
2015-09-04 | \n", "6342 | \n", "33614 | \n", "
2015-09-05 | \n", "13052 | \n", "20953 | \n", "
2015-09-06 | \n", "14346 | \n", "18853 | \n", "
... | \n", "... | \n", "... | \n", "
2015-09-25 | \n", "7189 | \n", "44179 | \n", "
2015-09-26 | \n", "11093 | \n", "31467 | \n", "
2015-09-27 | \n", "9162 | \n", "29123 | \n", "
2015-09-28 | \n", "5407 | \n", "42604 | \n", "
2015-09-29 | \n", "4895 | \n", "43830 | \n", "
2015-09-30 | \n", "2804 | \n", "36641 | \n", "
30 rows × 2 columns
\n", "\n", " | days | \n", "hours | \n", "minutes | \n", "seconds | \n", "milliseconds | \n", "microseconds | \n", "nanoseconds | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
1 | \n", "32 | \n", "0 | \n", "0 | \n", "2 | \n", "0 | \n", "0 | \n", "0 | \n", "
2 | \n", "60 | \n", "0 | \n", "0 | \n", "4 | \n", "0 | \n", "0 | \n", "0 | \n", "
3 | \n", "91 | \n", "0 | \n", "0 | \n", "6 | \n", "0 | \n", "0 | \n", "0 | \n", "
4 | \n", "121 | \n", "0 | \n", "0 | \n", "8 | \n", "0 | \n", "0 | \n", "0 | \n", "
\n", " | open | \n", "high | \n", "low | \n", "close | \n", "
---|---|---|---|---|
2013-01-01 09:30:00.000 | \n", "50.050176 | \n", "50.050176 | \n", "50.050176 | \n", "50.050176 | \n", "
2013-01-01 09:30:00.001 | \n", "49.969851 | \n", "50.138129 | \n", "49.969851 | \n", "50.138129 | \n", "
2013-01-01 09:30:00.002 | \n", "49.888302 | \n", "49.888302 | \n", "49.888302 | \n", "49.888302 | \n", "
2013-01-01 09:30:00.003 | \n", "50.017030 | \n", "50.035368 | \n", "50.017030 | \n", "50.035368 | \n", "
2013-01-01 09:30:00.004 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
2013-01-01 09:30:00.005 | \n", "50.062878 | \n", "50.062878 | \n", "49.921889 | \n", "49.921889 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2013-01-01 09:30:00.994 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
2013-01-01 09:30:00.995 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
2013-01-01 09:30:00.996 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
2013-01-01 09:30:00.997 | \n", "49.907617 | \n", "49.907617 | \n", "49.907617 | \n", "49.907617 | \n", "
2013-01-01 09:30:00.998 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
2013-01-01 09:30:00.999 | \n", "49.925853 | \n", "49.925853 | \n", "49.925853 | \n", "49.925853 | \n", "
1000 rows × 4 columns
\n", "\n", " | open | \n", "high | \n", "low | \n", "close | \n", "
---|---|---|---|---|
2013-01-01 09:30:00.000 | \n", "50.050176 | \n", "50.050176 | \n", "50.050176 | \n", "50.050176 | \n", "
2013-01-01 09:30:00.001 | \n", "49.969851 | \n", "50.138129 | \n", "49.969851 | \n", "50.138129 | \n", "
2013-01-01 09:30:00.002 | \n", "49.888302 | \n", "49.888302 | \n", "49.888302 | \n", "49.888302 | \n", "
2013-01-01 09:30:00.003 | \n", "50.017030 | \n", "50.035368 | \n", "50.017030 | \n", "50.035368 | \n", "
2013-01-01 09:30:00.004 | \n", "50.017030 | \n", "50.035368 | \n", "50.017030 | \n", "50.035368 | \n", "
2013-01-01 09:30:00.005 | \n", "50.062878 | \n", "50.062878 | \n", "49.921889 | \n", "49.921889 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2013-01-01 09:30:00.994 | \n", "49.845309 | \n", "50.023058 | \n", "49.845309 | \n", "49.904009 | \n", "
2013-01-01 09:30:00.995 | \n", "49.845309 | \n", "50.023058 | \n", "49.845309 | \n", "49.904009 | \n", "
2013-01-01 09:30:00.996 | \n", "49.845309 | \n", "50.023058 | \n", "49.845309 | \n", "49.904009 | \n", "
2013-01-01 09:30:00.997 | \n", "49.907617 | \n", "49.907617 | \n", "49.907617 | \n", "49.907617 | \n", "
2013-01-01 09:30:00.998 | \n", "49.907617 | \n", "49.907617 | \n", "49.907617 | \n", "49.907617 | \n", "
2013-01-01 09:30:00.999 | \n", "49.925853 | \n", "49.925853 | \n", "49.925853 | \n", "49.925853 | \n", "
1000 rows × 4 columns
\n", "