{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Mobike SODA sample data (Shanghai)\n", "\n", "Data source: http://shanghai.sodachallenges.com/data.html" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "ExecuteTime": { "end_time": "2017-07-19T16:12:10.971924", "start_time": "2017-07-19T16:12:10.221101" }, "collapsed": true }, "outputs": [], "source": [ "import os\n", "\n", "import pandas as pd" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "ExecuteTime": { "end_time": "2017-07-19T16:14:57.643991", "start_time": "2017-07-19T16:14:57.058263" } }, "outputs": [], "source": [ "# Folder holding the sample CSV. Set the SODA_DATA_DIR environment variable to\n", "# point at a different location; the default is the original local folder.\n", "DATA_DIR = os.environ.get('SODA_DATA_DIR', '/Users/chengjun/bigdata/soda-2017-sample/2017/Mobike_SODA_Sample')\n", "df = pd.read_csv(os.path.join(DATA_DIR, 'shanghai_sample.csv'))" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "ExecuteTime": { "end_time": "2017-07-19T16:15:01.772053", "start_time": "2017-07-19T16:15:01.728675" } }, "outputs": [ { "data": { "text/html": [ "
\n", " | orderid | \n", "bikeid | \n", "userid | \n", "start_time | \n", "start_location_x | \n", "start_location_y | \n", "end_time | \n", "end_location_x | \n", "end_location_y | \n", "track | \n", "
---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "57099 | \n", "4717 | \n", "4717 | \n", "2016-08-02 17:23:43 | \n", "121.410 | \n", "31.306 | \n", "2016-08-02 17:31:08 | \n", "121.402 | \n", "31.311 | \n", "121.402,31.310#121.402,31.311#121.403,31.309#1... | \n", "
1 | \n", "165262 | \n", "413 | \n", "413 | \n", "2016-08-04 20:17:09 | \n", "121.407 | \n", "31.288 | \n", "2016-08-04 20:19:58 | \n", "121.408 | \n", "31.291 | \n", "121.407,31.288#121.408,31.289#121.408,31.290#1... | \n", "
2 | \n", "8023 | \n", "3993 | \n", "3993 | \n", "2016-08-02 08:16:52 | \n", "121.462 | \n", "31.312 | \n", "2016-08-02 08:25:10 | \n", "121.449 | \n", "31.305 | \n", "121.449,31.305#121.450,31.305#121.451,31.305#1... | \n", "
3 | \n", "148871 | \n", "1340 | \n", "1340 | \n", "2016-08-05 18:37:20 | \n", "121.531 | \n", "31.313 | \n", "2016-08-05 18:45:19 | \n", "121.519 | \n", "31.308 | \n", "121.519,31.308#121.519,31.309#121.520,31.309#1... | \n", "
4 | \n", "10222 | \n", "4174 | \n", "4174 | \n", "2016-08-06 11:04:50 | \n", "121.401 | \n", "31.232 | \n", "2016-08-06 11:21:04 | \n", "121.376 | \n", "31.237 | \n", "121.374,31.234#121.375,31.233#121.375,31.235#1... | \n", "