{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 101,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<script>requirejs.config({paths: { 'plotly': ['https://cdn.plot.ly/plotly-latest.min']},});if(!window.Plotly) {{require(['plotly'],function(plotly) {window.Plotly=plotly;});}}</script>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "import plotly.graph_objs as go\n",
    "from plotly.offline import download_plotlyjs, init_notebook_mode, iplot\n",
    "\n",
    "init_notebook_mode(connected=True)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "We will use the `gbq.read_gbq` function to read BigQuery datasets into Pandas `DataFrame` objects."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 102,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "from pandas.io import gbq"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 103,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "import numpy as np"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "We will use `linregress` function for linear regression of scatter plots."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 104,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "from scipy.stats import linregress"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Data Collection"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Read the post [Using Google BigQuery with Plotly and Pandas](moderndata.plot.ly/using-google-bigquery-with-plotly-and-pandas/) to create a new project."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 105,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "project_id = 'sixth-edition-678'"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "This query will collect the `timestamp`, `package name`, and `total download count` columns from the table (on a daily basis)."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 106,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "daily_download_query = \"\"\"\n",
    "SELECT\n",
    "  DATE(timestamp) as day,\n",
    "  MONTH(timestamp) as month,\n",
    "  file.project,\n",
    "  COUNT(*) as total_downloads,\n",
    "FROM\n",
    "  TABLE_DATE_RANGE(\n",
    "    [the-psf:pypi.downloads],\n",
    "    TIMESTAMP(\"20120701\"),\n",
    "    CURRENT_TIMESTAMP()\n",
    "  )\n",
    "WHERE\n",
    "  file.project = '{0}'\n",
    "GROUP BY\n",
    "  day, file.project, month\n",
    "ORDER BY\n",
    "  day asc\n",
    "\"\"\""
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "The following function run the query and returns a DataFrame object, if successful."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 107,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "def package_df(package):\n",
    "    \"\"\" Return the query result as a pandas.DataFrame object\n",
    "    \n",
    "    param: package(str): Name of the package on PyPI\n",
    "    \"\"\"\n",
    "    \n",
    "    try:\n",
    "        df = gbq.read_gbq(daily_download_query.format(package), project_id=project_id)\n",
    "        return df\n",
    "    except:\n",
    "        raise IOError"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "We will construct different DataFrames for each package."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 108,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requesting query... ok.\n",
      "Query running...\n",
      "Query done.\n",
      "Processed: 35.8 Gb\n",
      "\n",
      "Retrieving results...\n",
      "  Got page: 1; 100.0% done. Elapsed 13.68 s.\n",
      "Got 144 rows.\n",
      "\n",
      "Total time taken 14.04 s.\n",
      "Finished at 2016-08-29 13:04:38.\n"
     ]
    }
   ],
   "source": [
    "plotly_df = package_df('plotly')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 109,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requesting query... ok.\n",
      "Query running...\n",
      "Query done.\n",
      "Processed: 35.8 Gb\n",
      "\n",
      "Retrieving results...\n",
      "  Got page: 1; 100.0% done. Elapsed 15.13 s.\n",
      "Got 144 rows.\n",
      "\n",
      "Total time taken 15.15 s.\n",
      "Finished at 2016-08-29 13:04:53.\n"
     ]
    }
   ],
   "source": [
    "bokeh_df = package_df('bokeh')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 110,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requesting query... ok.\n",
      "Query running...\n",
      "  Elapsed 14.52 s. Waiting...\n",
      "Query done.\n",
      "Processed: 35.8 Gb\n",
      "\n",
      "Retrieving results...\n",
      "  Got page: 1; 100.0% done. Elapsed 15.37 s.\n",
      "Got 144 rows.\n",
      "\n",
      "Total time taken 15.39 s.\n",
      "Finished at 2016-08-29 13:05:09.\n"
     ]
    }
   ],
   "source": [
    "matplotlib_df = package_df('matplotlib')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 111,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requesting query... ok.\n",
      "Query running...\n",
      "Query done.\n",
      "Processed: 35.8 Gb\n",
      "\n",
      "Retrieving results...\n",
      "  Got page: 1; 100.0% done. Elapsed 13.45 s.\n",
      "Got 144 rows.\n",
      "\n",
      "Total time taken 13.47 s.\n",
      "Finished at 2016-08-29 13:05:22.\n"
     ]
    }
   ],
   "source": [
    "mpld3_df = package_df('mpld3')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 112,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requesting query... ok.\n",
      "Query running...\n",
      "Query done.\n",
      "Processed: 35.8 Gb\n",
      "\n",
      "Retrieving results...\n",
      "  Got page: 1; 100.0% done. Elapsed 14.06 s.\n",
      "Got 144 rows.\n",
      "\n",
      "Total time taken 14.08 s.\n",
      "Finished at 2016-08-29 13:05:36.\n"
     ]
    }
   ],
   "source": [
    "vincent_df = package_df('vincent')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Inspection for Missing Data"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Using a simple `TimeDelta` calculation, we can find if some rows are missing from the DataFrame."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 113,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "77 rows are missing in the DataFrame.\n"
     ]
    }
   ],
   "source": [
    "from datetime import datetime, timedelta\n",
    "\n",
    "# Number of rows in the DataFrame\n",
    "actual_rows = len(plotly_df)\n",
    "\n",
    "start_date = datetime.strptime(plotly_df.iloc[0]['day'], '%Y-%m-%d') # 2016-01-22\n",
    "end_date = datetime.strptime(plotly_df.iloc[actual_rows - 1]['day'], '%Y-%m-%d') # 2016-08-29\n",
    "\n",
    "# Expected rows if there was no missing data (day)\n",
    "expected_rows = (end_date - start_date).days + 1\n",
    "\n",
    "if (actual_rows != expected_rows):\n",
    "    print \"{0} rows are missing in the DataFrame.\".format(expected_rows - actual_rows)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "We find that there are no rows from **2016-03-06** to **2016-05-21**."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Data Transformation\n",
    "\n",
    "Here, we will concate the missing values in the DataFrames."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 118,
   "metadata": {
    "collapsed": false
   },
   "outputs": [],
   "source": [
    "missing_data_start_date = '2016-03-06'\n",
    "missing_data_end_date = '2016-05-21'\n",
    "\n",
    "# starting/ending date for missing data and time differene (1 day)\n",
    "s = datetime.strptime(missing_data_start_date, '%Y-%m-%d')\n",
    "e = datetime.strptime(missing_data_end_date, '%Y-%m-%d')\n",
    "diff = timedelta(days=1)\n",
    "\n",
    "# generate all the missing dates in the same format\n",
    "missing_dates = []\n",
    "missing_dates_month = []\n",
    "\n",
    "while (s <= e):\n",
    "    missing_dates.append(s.strftime('%Y-%m-%d'))\n",
    "    missing_dates_month.append(int(s.strftime('%m')[1]))\n",
    "    s += diff\n",
    "    \n",
    "missing_row_count = len(missing_dates) # 77"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 123,
   "metadata": {
    "collapsed": false
   },
   "outputs": [],
   "source": [
    "def append_missing_data(dataframe, package):\n",
    "    \"\"\"Append the missing dates DataFrame to a given DataFrame\n",
    "    \n",
    "    param: dataframe(pandas.DataFrame): DataFrame to append\n",
    "    param: package(str): Name of package on PyPI\n",
    "    \"\"\"\n",
    "    \n",
    "    missing_dates_df = pd.DataFrame({'day': missing_dates,\n",
    "                                    'month': missing_dates_month,\n",
    "                                    'file_project': [package for i in range(missing_row_count)],\n",
    "                                    'total_downloads': [0 for i in range(missing_row_count)]}\n",
    "                                   )\n",
    "    \n",
    "    # place the appended columns at their right place by sorting\n",
    "    new_df = pd.concat([dataframe, missing_dates_df])\n",
    "    \n",
    "    return new_df.sort_values('day')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Updated DataFrames with the recovered missing data."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 127,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "bokeh_df = append_missing_data(bokeh_df, 'bokeh')\n",
    "matplotlib_df = append_missing_data(matplotlib_df, 'matplotlib')\n",
    "mpld3_df = append_missing_data(mpld3_df, 'mpld3')\n",
    "plotly_df = append_missing_data(plotly_df, 'plotly')\n",
    "vincent_df = append_missing_data(vincent_df, 'vincent')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Package Downloads Comparison (Daily)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 128,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div id=\"46e97236-73d8-4735-bf2a-29d655f4a56f\" style=\"height: 525px; width: 100%;\" class=\"plotly-graph-div\"></div><script type=\"text/javascript\">require([\"plotly\"], function(Plotly) { window.PLOTLYENV=window.PLOTLYENV || {};window.PLOTLYENV.BASE_URL=\"https://plot.ly\";Plotly.newPlot(\"46e97236-73d8-4735-bf2a-29d655f4a56f\", [{\"name\": \"Plotly\", \"mode\": \"lines\", \"y\": [801, 334, 480, 762, 817, 1373, 653, 718, 489, 364, 900, 830, 750, 1014, 1151, 472, 556, 689, 1124, 738, 983, 880, 513, 392, 632, 950, 1092, 980, 1308, 627, 484, 880, 1433, 1207, 1643, 1014, 901, 782, 995, 1478, 1225, 1099, 1110, 1096, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1054, 1738, 1622, 1814, 2226, 2172, 1189, 866, 1623, 1642, 2464, 2361, 2000, 1645, 1002, 2013, 2416, 1972, 1546, 2812, 874, 726, 2204, 2525, 1613, 1500, 1832, 934, 711, 1944, 1724, 1851, 2628, 1790, 1001, 1075, 1504, 1542, 1619, 2215, 1615, 1154, 787, 1111, 1359, 2244, 2006, 2260, 1895, 1092, 2300, 2432, 2378, 3063, 2521, 1546, 1195, 2368, 2673, 2458, 3163, 2499, 1095, 814, 2182, 2655, 2515, 3089, 2869, 969, 1031, 2110, 2851, 2759, 2871, 3139, 1331, 1236, 2936, 3010, 3667, 2534, 3227, 1271, 1101, 2517, 2575, 4068, 3102, 2826, 2195, 1224, 2708, 3134, 2556, 3085, 9340, 8579, 8098, 2763], \"x\": [\"2016-01-22\", \"2016-01-23\", \"2016-01-24\", \"2016-01-25\", \"2016-01-26\", \"2016-01-27\", \"2016-01-28\", \"2016-01-29\", \"2016-01-30\", \"2016-01-31\", \"2016-02-01\", \"2016-02-02\", \"2016-02-03\", \"2016-02-04\", \"2016-02-05\", \"2016-02-06\", \"2016-02-07\", \"2016-02-08\", \"2016-02-09\", \"2016-02-10\", \"2016-02-11\", \"2016-02-12\", \"2016-02-13\", \"2016-02-14\", \"2016-02-15\", \"2016-02-16\", \"2016-02-17\", \"2016-02-18\", \"2016-02-19\", \"2016-02-20\", \"2016-02-21\", \"2016-02-22\", \"2016-02-23\", 
\"2016-02-24\", \"2016-02-25\", \"2016-02-26\", \"2016-02-27\", \"2016-02-28\", \"2016-02-29\", \"2016-03-01\", \"2016-03-02\", \"2016-03-03\", \"2016-03-04\", \"2016-03-05\", \"2016-03-06\", \"2016-03-07\", \"2016-03-08\", \"2016-03-09\", \"2016-03-10\", \"2016-03-11\", \"2016-03-12\", \"2016-03-13\", \"2016-03-14\", \"2016-03-15\", \"2016-03-16\", \"2016-03-17\", \"2016-03-18\", \"2016-03-19\", \"2016-03-20\", \"2016-03-21\", \"2016-03-22\", \"2016-03-23\", \"2016-03-24\", \"2016-03-25\", \"2016-03-26\", \"2016-03-27\", \"2016-03-28\", \"2016-03-29\", \"2016-03-30\", \"2016-03-31\", \"2016-04-01\", \"2016-04-02\", \"2016-04-03\", \"2016-04-04\", \"2016-04-05\", \"2016-04-06\", \"2016-04-07\", \"2016-04-08\", \"2016-04-09\", \"2016-04-10\", \"2016-04-11\", \"2016-04-12\", \"2016-04-13\", \"2016-04-14\", \"2016-04-15\", \"2016-04-16\", \"2016-04-17\", \"2016-04-18\", \"2016-04-19\", \"2016-04-20\", \"2016-04-21\", \"2016-04-22\", \"2016-04-23\", \"2016-04-24\", \"2016-04-25\", \"2016-04-26\", \"2016-04-27\", \"2016-04-28\", \"2016-04-29\", \"2016-04-30\", \"2016-05-01\", \"2016-05-02\", \"2016-05-03\", \"2016-05-04\", \"2016-05-05\", \"2016-05-06\", \"2016-05-07\", \"2016-05-08\", \"2016-05-09\", \"2016-05-10\", \"2016-05-11\", \"2016-05-12\", \"2016-05-13\", \"2016-05-14\", \"2016-05-15\", \"2016-05-16\", \"2016-05-17\", \"2016-05-18\", \"2016-05-19\", \"2016-05-20\", \"2016-05-21\", \"2016-05-22\", \"2016-05-23\", \"2016-05-24\", \"2016-05-25\", \"2016-05-26\", \"2016-05-27\", \"2016-05-28\", \"2016-05-29\", \"2016-05-30\", \"2016-05-31\", \"2016-06-01\", \"2016-06-02\", \"2016-06-03\", \"2016-06-04\", \"2016-06-05\", \"2016-06-06\", \"2016-06-07\", \"2016-06-08\", \"2016-06-09\", \"2016-06-10\", \"2016-06-11\", \"2016-06-12\", \"2016-06-13\", \"2016-06-14\", \"2016-06-15\", \"2016-06-16\", \"2016-06-17\", \"2016-06-18\", \"2016-06-19\", \"2016-06-20\", \"2016-06-21\", \"2016-06-22\", \"2016-06-23\", \"2016-06-24\", \"2016-06-25\", \"2016-06-26\", \"2016-06-27\", 
\"2016-06-28\", \"2016-06-29\", \"2016-06-30\", \"2016-07-01\", \"2016-07-02\", \"2016-07-03\", \"2016-07-04\", \"2016-07-05\", \"2016-07-06\", \"2016-07-07\", \"2016-07-08\", \"2016-07-09\", \"2016-07-10\", \"2016-07-11\", \"2016-07-12\", \"2016-07-13\", \"2016-07-14\", \"2016-07-15\", \"2016-07-16\", \"2016-07-17\", \"2016-07-18\", \"2016-07-19\", \"2016-07-20\", \"2016-07-21\", \"2016-07-22\", \"2016-07-23\", \"2016-07-24\", \"2016-07-25\", \"2016-07-26\", \"2016-07-27\", \"2016-07-28\", \"2016-07-29\", \"2016-07-30\", \"2016-07-31\", \"2016-08-01\", \"2016-08-02\", \"2016-08-03\", \"2016-08-04\", \"2016-08-05\", \"2016-08-06\", \"2016-08-07\", \"2016-08-08\", \"2016-08-09\", \"2016-08-10\", \"2016-08-11\", \"2016-08-12\", \"2016-08-13\", \"2016-08-14\", \"2016-08-15\", \"2016-08-16\", \"2016-08-17\", \"2016-08-18\", \"2016-08-19\", \"2016-08-20\", \"2016-08-21\", \"2016-08-22\", \"2016-08-23\", \"2016-08-24\", \"2016-08-25\", \"2016-08-26\", \"2016-08-27\", \"2016-08-28\", \"2016-08-29\"], \"line\": {\"color\": \"rgb(10. 
240, 10)\", \"width\": 0.5}, \"type\": \"scatter\", \"fill\": \"tonexty\"}, {\"name\": \"Bokeh\", \"mode\": \"lines\", \"y\": [426, 264, 228, 362, 498, 543, 354, 372, 206, 206, 367, 310, 441, 665, 573, 226, 281, 368, 485, 476, 511, 327, 237, 208, 573, 361, 504, 427, 559, 285, 215, 418, 511, 490, 576, 434, 258, 210, 438, 532, 580, 474, 478, 250, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 328, 685, 698, 826, 655, 532, 377, 245, 533, 536, 868, 804, 587, 427, 253, 723, 878, 633, 3047, 975, 412, 310, 625, 559, 580, 523, 799, 226, 286, 588, 678, 707, 914, 526, 137, 225, 567, 1152, 852, 687, 786, 235, 296, 464, 624, 624, 612, 865, 341, 300, 592, 751, 675, 986, 829, 338, 313, 791, 1017, 862, 831, 739, 389, 268, 826, 802, 950, 1157, 1007, 548, 494, 994, 1060, 717, 851, 802, 421, 424, 740, 855, 1020, 852, 639, 258, 247, 577, 796, 720, 1173, 897, 677, 348, 859, 747, 715, 876, 923, 355, 250, 96], \"x\": [\"2016-01-22\", \"2016-01-23\", \"2016-01-24\", \"2016-01-25\", \"2016-01-26\", \"2016-01-27\", \"2016-01-28\", \"2016-01-29\", \"2016-01-30\", \"2016-01-31\", \"2016-02-01\", \"2016-02-02\", \"2016-02-03\", \"2016-02-04\", \"2016-02-05\", \"2016-02-06\", \"2016-02-07\", \"2016-02-08\", \"2016-02-09\", \"2016-02-10\", \"2016-02-11\", \"2016-02-12\", \"2016-02-13\", \"2016-02-14\", \"2016-02-15\", \"2016-02-16\", \"2016-02-17\", \"2016-02-18\", \"2016-02-19\", \"2016-02-20\", \"2016-02-21\", \"2016-02-22\", \"2016-02-23\", \"2016-02-24\", \"2016-02-25\", \"2016-02-26\", \"2016-02-27\", \"2016-02-28\", \"2016-02-29\", \"2016-03-01\", \"2016-03-02\", \"2016-03-03\", \"2016-03-04\", \"2016-03-05\", \"2016-03-06\", \"2016-03-07\", \"2016-03-08\", \"2016-03-09\", \"2016-03-10\", \"2016-03-11\", \"2016-03-12\", \"2016-03-13\", \"2016-03-14\", \"2016-03-15\", \"2016-03-16\", \"2016-03-17\", 
\"2016-03-18\", \"2016-03-19\", \"2016-03-20\", \"2016-03-21\", \"2016-03-22\", \"2016-03-23\", \"2016-03-24\", \"2016-03-25\", \"2016-03-26\", \"2016-03-27\", \"2016-03-28\", \"2016-03-29\", \"2016-03-30\", \"2016-03-31\", \"2016-04-01\", \"2016-04-02\", \"2016-04-03\", \"2016-04-04\", \"2016-04-05\", \"2016-04-06\", \"2016-04-07\", \"2016-04-08\", \"2016-04-09\", \"2016-04-10\", \"2016-04-11\", \"2016-04-12\", \"2016-04-13\", \"2016-04-14\", \"2016-04-15\", \"2016-04-16\", \"2016-04-17\", \"2016-04-18\", \"2016-04-19\", \"2016-04-20\", \"2016-04-21\", \"2016-04-22\", \"2016-04-23\", \"2016-04-24\", \"2016-04-25\", \"2016-04-26\", \"2016-04-27\", \"2016-04-28\", \"2016-04-29\", \"2016-04-30\", \"2016-05-01\", \"2016-05-02\", \"2016-05-03\", \"2016-05-04\", \"2016-05-05\", \"2016-05-06\", \"2016-05-07\", \"2016-05-08\", \"2016-05-09\", \"2016-05-10\", \"2016-05-11\", \"2016-05-12\", \"2016-05-13\", \"2016-05-14\", \"2016-05-15\", \"2016-05-16\", \"2016-05-17\", \"2016-05-18\", \"2016-05-19\", \"2016-05-20\", \"2016-05-21\", \"2016-05-22\", \"2016-05-23\", \"2016-05-24\", \"2016-05-25\", \"2016-05-26\", \"2016-05-27\", \"2016-05-28\", \"2016-05-29\", \"2016-05-30\", \"2016-05-31\", \"2016-06-01\", \"2016-06-02\", \"2016-06-03\", \"2016-06-04\", \"2016-06-05\", \"2016-06-06\", \"2016-06-07\", \"2016-06-08\", \"2016-06-09\", \"2016-06-10\", \"2016-06-11\", \"2016-06-12\", \"2016-06-13\", \"2016-06-14\", \"2016-06-15\", \"2016-06-16\", \"2016-06-17\", \"2016-06-18\", \"2016-06-19\", \"2016-06-20\", \"2016-06-21\", \"2016-06-22\", \"2016-06-23\", \"2016-06-24\", \"2016-06-25\", \"2016-06-26\", \"2016-06-27\", \"2016-06-28\", \"2016-06-29\", \"2016-06-30\", \"2016-07-01\", \"2016-07-02\", \"2016-07-03\", \"2016-07-04\", \"2016-07-05\", \"2016-07-06\", \"2016-07-07\", \"2016-07-08\", \"2016-07-09\", \"2016-07-10\", \"2016-07-11\", \"2016-07-12\", \"2016-07-13\", \"2016-07-14\", \"2016-07-15\", \"2016-07-16\", \"2016-07-17\", \"2016-07-18\", \"2016-07-19\", \"2016-07-20\", 
\"2016-07-21\", \"2016-07-22\", \"2016-07-23\", \"2016-07-24\", \"2016-07-25\", \"2016-07-26\", \"2016-07-27\", \"2016-07-28\", \"2016-07-29\", \"2016-07-30\", \"2016-07-31\", \"2016-08-01\", \"2016-08-02\", \"2016-08-03\", \"2016-08-04\", \"2016-08-05\", \"2016-08-06\", \"2016-08-07\", \"2016-08-08\", \"2016-08-09\", \"2016-08-10\", \"2016-08-11\", \"2016-08-12\", \"2016-08-13\", \"2016-08-14\", \"2016-08-15\", \"2016-08-16\", \"2016-08-17\", \"2016-08-18\", \"2016-08-19\", \"2016-08-20\", \"2016-08-21\", \"2016-08-22\", \"2016-08-23\", \"2016-08-24\", \"2016-08-25\", \"2016-08-26\", \"2016-08-27\", \"2016-08-28\", \"2016-08-29\"], \"line\": {\"color\": \"rgb(42, 77, 20)\", \"width\": 0.5}, \"type\": \"scatter\", \"fill\": \"tonexty\"}, {\"name\": \"MPLD3\", \"mode\": \"lines\", \"y\": [97, 43, 43, 115, 151, 115, 125, 93, 73, 60, 123, 140, 133, 129, 111, 37, 31, 109, 120, 149, 101, 92, 31, 45, 83, 119, 109, 118, 146, 99, 110, 128, 145, 172, 119, 105, 53, 52, 105, 115, 136, 136, 135, 106, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 70, 187, 120, 146, 157, 141, 59, 49, 143, 174, 146, 127, 152, 53, 52, 101, 139, 95, 111, 109, 53, 52, 116, 178, 120, 203, 174, 43, 54, 185, 231, 191, 203, 260, 61, 67, 150, 155, 89, 153, 133, 76, 61, 100, 189, 240, 105, 143, 71, 64, 140, 206, 186, 211, 351, 171, 67, 322, 275, 248, 277, 248, 82, 109, 148, 255, 247, 250, 227, 63, 79, 182, 231, 148, 216, 156, 70, 61, 172, 319, 302, 229, 219, 95, 68, 201, 232, 257, 215, 242, 85, 68, 159, 162, 198, 322, 541, 71, 74, 28], \"x\": [\"2016-01-22\", \"2016-01-23\", \"2016-01-24\", \"2016-01-25\", \"2016-01-26\", \"2016-01-27\", \"2016-01-28\", \"2016-01-29\", \"2016-01-30\", \"2016-01-31\", \"2016-02-01\", \"2016-02-02\", \"2016-02-03\", \"2016-02-04\", \"2016-02-05\", \"2016-02-06\", \"2016-02-07\", 
\"2016-02-08\", \"2016-02-09\", \"2016-02-10\", \"2016-02-11\", \"2016-02-12\", \"2016-02-13\", \"2016-02-14\", \"2016-02-15\", \"2016-02-16\", \"2016-02-17\", \"2016-02-18\", \"2016-02-19\", \"2016-02-20\", \"2016-02-21\", \"2016-02-22\", \"2016-02-23\", \"2016-02-24\", \"2016-02-25\", \"2016-02-26\", \"2016-02-27\", \"2016-02-28\", \"2016-02-29\", \"2016-03-01\", \"2016-03-02\", \"2016-03-03\", \"2016-03-04\", \"2016-03-05\", \"2016-03-06\", \"2016-03-07\", \"2016-03-08\", \"2016-03-09\", \"2016-03-10\", \"2016-03-11\", \"2016-03-12\", \"2016-03-13\", \"2016-03-14\", \"2016-03-15\", \"2016-03-16\", \"2016-03-17\", \"2016-03-18\", \"2016-03-19\", \"2016-03-20\", \"2016-03-21\", \"2016-03-22\", \"2016-03-23\", \"2016-03-24\", \"2016-03-25\", \"2016-03-26\", \"2016-03-27\", \"2016-03-28\", \"2016-03-29\", \"2016-03-30\", \"2016-03-31\", \"2016-04-01\", \"2016-04-02\", \"2016-04-03\", \"2016-04-04\", \"2016-04-05\", \"2016-04-06\", \"2016-04-07\", \"2016-04-08\", \"2016-04-09\", \"2016-04-10\", \"2016-04-11\", \"2016-04-12\", \"2016-04-13\", \"2016-04-14\", \"2016-04-15\", \"2016-04-16\", \"2016-04-17\", \"2016-04-18\", \"2016-04-19\", \"2016-04-20\", \"2016-04-21\", \"2016-04-22\", \"2016-04-23\", \"2016-04-24\", \"2016-04-25\", \"2016-04-26\", \"2016-04-27\", \"2016-04-28\", \"2016-04-29\", \"2016-04-30\", \"2016-05-01\", \"2016-05-02\", \"2016-05-03\", \"2016-05-04\", \"2016-05-05\", \"2016-05-06\", \"2016-05-07\", \"2016-05-08\", \"2016-05-09\", \"2016-05-10\", \"2016-05-11\", \"2016-05-12\", \"2016-05-13\", \"2016-05-14\", \"2016-05-15\", \"2016-05-16\", \"2016-05-17\", \"2016-05-18\", \"2016-05-19\", \"2016-05-20\", \"2016-05-21\", \"2016-05-22\", \"2016-05-23\", \"2016-05-24\", \"2016-05-25\", \"2016-05-26\", \"2016-05-27\", \"2016-05-28\", \"2016-05-29\", \"2016-05-30\", \"2016-05-31\", \"2016-06-01\", \"2016-06-02\", \"2016-06-03\", \"2016-06-04\", \"2016-06-05\", \"2016-06-06\", \"2016-06-07\", \"2016-06-08\", \"2016-06-09\", \"2016-06-10\", \"2016-06-11\", 
\"2016-06-12\", \"2016-06-13\", \"2016-06-14\", \"2016-06-15\", \"2016-06-16\", \"2016-06-17\", \"2016-06-18\", \"2016-06-19\", \"2016-06-20\", \"2016-06-21\", \"2016-06-22\", \"2016-06-23\", \"2016-06-24\", \"2016-06-25\", \"2016-06-26\", \"2016-06-27\", \"2016-06-28\", \"2016-06-29\", \"2016-06-30\", \"2016-07-01\", \"2016-07-02\", \"2016-07-03\", \"2016-07-04\", \"2016-07-05\", \"2016-07-06\", \"2016-07-07\", \"2016-07-08\", \"2016-07-09\", \"2016-07-10\", \"2016-07-11\", \"2016-07-12\", \"2016-07-13\", \"2016-07-14\", \"2016-07-15\", \"2016-07-16\", \"2016-07-17\", \"2016-07-18\", \"2016-07-19\", \"2016-07-20\", \"2016-07-21\", \"2016-07-22\", \"2016-07-23\", \"2016-07-24\", \"2016-07-25\", \"2016-07-26\", \"2016-07-27\", \"2016-07-28\", \"2016-07-29\", \"2016-07-30\", \"2016-07-31\", \"2016-08-01\", \"2016-08-02\", \"2016-08-03\", \"2016-08-04\", \"2016-08-05\", \"2016-08-06\", \"2016-08-07\", \"2016-08-08\", \"2016-08-09\", \"2016-08-10\", \"2016-08-11\", \"2016-08-12\", \"2016-08-13\", \"2016-08-14\", \"2016-08-15\", \"2016-08-16\", \"2016-08-17\", \"2016-08-18\", \"2016-08-19\", \"2016-08-20\", \"2016-08-21\", \"2016-08-22\", \"2016-08-23\", \"2016-08-24\", \"2016-08-25\", \"2016-08-26\", \"2016-08-27\", \"2016-08-28\", \"2016-08-29\"], \"line\": {\"color\": \"rgb(20, 33, 61)\", \"width\": 0.5}, \"type\": \"scatter\", \"fill\": \"tonexty\"}, {\"name\": \"Vincent\", \"mode\": \"lines\", \"y\": [49, 31, 71, 40, 61, 119, 97, 47, 47, 47, 102, 55, 50, 57, 97, 37, 66, 49, 59, 51, 67, 54, 74, 31, 67, 100, 104, 59, 125, 19, 54, 54, 85, 59, 117, 93, 103, 41, 81, 148, 74, 84, 60, 104, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 68, 135, 156, 160, 107, 125, 94, 52, 87, 175, 135, 160, 155, 130, 64, 79, 144, 106, 77, 69, 88, 57, 110, 153, 79, 122, 160, 107, 80, 102, 139, 161, 194, 163, 
87, 74, 92, 100, 123, 187, 149, 71, 119, 73, 143, 161, 115, 89, 86, 79, 119, 135, 135, 167, 157, 82, 94, 142, 187, 106, 135, 153, 57, 71, 86, 105, 176, 223, 161, 76, 96, 126, 166, 145, 129, 171, 145, 117, 125, 140, 178, 86, 134, 95, 78, 90, 163, 187, 159, 143, 133, 93, 109, 106, 86, 169, 489, 115, 68, 39], \"x\": [\"2016-01-22\", \"2016-01-23\", \"2016-01-24\", \"2016-01-25\", \"2016-01-26\", \"2016-01-27\", \"2016-01-28\", \"2016-01-29\", \"2016-01-30\", \"2016-01-31\", \"2016-02-01\", \"2016-02-02\", \"2016-02-03\", \"2016-02-04\", \"2016-02-05\", \"2016-02-06\", \"2016-02-07\", \"2016-02-08\", \"2016-02-09\", \"2016-02-10\", \"2016-02-11\", \"2016-02-12\", \"2016-02-13\", \"2016-02-14\", \"2016-02-15\", \"2016-02-16\", \"2016-02-17\", \"2016-02-18\", \"2016-02-19\", \"2016-02-20\", \"2016-02-21\", \"2016-02-22\", \"2016-02-23\", \"2016-02-24\", \"2016-02-25\", \"2016-02-26\", \"2016-02-27\", \"2016-02-28\", \"2016-02-29\", \"2016-03-01\", \"2016-03-02\", \"2016-03-03\", \"2016-03-04\", \"2016-03-05\", \"2016-03-06\", \"2016-03-07\", \"2016-03-08\", \"2016-03-09\", \"2016-03-10\", \"2016-03-11\", \"2016-03-12\", \"2016-03-13\", \"2016-03-14\", \"2016-03-15\", \"2016-03-16\", \"2016-03-17\", \"2016-03-18\", \"2016-03-19\", \"2016-03-20\", \"2016-03-21\", \"2016-03-22\", \"2016-03-23\", \"2016-03-24\", \"2016-03-25\", \"2016-03-26\", \"2016-03-27\", \"2016-03-28\", \"2016-03-29\", \"2016-03-30\", \"2016-03-31\", \"2016-04-01\", \"2016-04-02\", \"2016-04-03\", \"2016-04-04\", \"2016-04-05\", \"2016-04-06\", \"2016-04-07\", \"2016-04-08\", \"2016-04-09\", \"2016-04-10\", \"2016-04-11\", \"2016-04-12\", \"2016-04-13\", \"2016-04-14\", \"2016-04-15\", \"2016-04-16\", \"2016-04-17\", \"2016-04-18\", \"2016-04-19\", \"2016-04-20\", \"2016-04-21\", \"2016-04-22\", \"2016-04-23\", \"2016-04-24\", \"2016-04-25\", \"2016-04-26\", \"2016-04-27\", \"2016-04-28\", \"2016-04-29\", \"2016-04-30\", \"2016-05-01\", \"2016-05-02\", \"2016-05-03\", \"2016-05-04\", \"2016-05-05\", 
\"2016-05-06\", \"2016-05-07\", \"2016-05-08\", \"2016-05-09\", \"2016-05-10\", \"2016-05-11\", \"2016-05-12\", \"2016-05-13\", \"2016-05-14\", \"2016-05-15\", \"2016-05-16\", \"2016-05-17\", \"2016-05-18\", \"2016-05-19\", \"2016-05-20\", \"2016-05-21\", \"2016-05-22\", \"2016-05-23\", \"2016-05-24\", \"2016-05-25\", \"2016-05-26\", \"2016-05-27\", \"2016-05-28\", \"2016-05-29\", \"2016-05-30\", \"2016-05-31\", \"2016-06-01\", \"2016-06-02\", \"2016-06-03\", \"2016-06-04\", \"2016-06-05\", \"2016-06-06\", \"2016-06-07\", \"2016-06-08\", \"2016-06-09\", \"2016-06-10\", \"2016-06-11\", \"2016-06-12\", \"2016-06-13\", \"2016-06-14\", \"2016-06-15\", \"2016-06-16\", \"2016-06-17\", \"2016-06-18\", \"2016-06-19\", \"2016-06-20\", \"2016-06-21\", \"2016-06-22\", \"2016-06-23\", \"2016-06-24\", \"2016-06-25\", \"2016-06-26\", \"2016-06-27\", \"2016-06-28\", \"2016-06-29\", \"2016-06-30\", \"2016-07-01\", \"2016-07-02\", \"2016-07-03\", \"2016-07-04\", \"2016-07-05\", \"2016-07-06\", \"2016-07-07\", \"2016-07-08\", \"2016-07-09\", \"2016-07-10\", \"2016-07-11\", \"2016-07-12\", \"2016-07-13\", \"2016-07-14\", \"2016-07-15\", \"2016-07-16\", \"2016-07-17\", \"2016-07-18\", \"2016-07-19\", \"2016-07-20\", \"2016-07-21\", \"2016-07-22\", \"2016-07-23\", \"2016-07-24\", \"2016-07-25\", \"2016-07-26\", \"2016-07-27\", \"2016-07-28\", \"2016-07-29\", \"2016-07-30\", \"2016-07-31\", \"2016-08-01\", \"2016-08-02\", \"2016-08-03\", \"2016-08-04\", \"2016-08-05\", \"2016-08-06\", \"2016-08-07\", \"2016-08-08\", \"2016-08-09\", \"2016-08-10\", \"2016-08-11\", \"2016-08-12\", \"2016-08-13\", \"2016-08-14\", \"2016-08-15\", \"2016-08-16\", \"2016-08-17\", \"2016-08-18\", \"2016-08-19\", \"2016-08-20\", \"2016-08-21\", \"2016-08-22\", \"2016-08-23\", \"2016-08-24\", \"2016-08-25\", \"2016-08-26\", \"2016-08-27\", \"2016-08-28\", \"2016-08-29\"], \"line\": {\"color\": \"rgb(0, 0, 0)\", \"width\": 0.5}, \"type\": \"scatter\", \"fill\": \"tonexty\"}], {\"showlegend\": true, \"yaxis\": 
{\"range\": [1, 10000], \"type\": \"linear\", \"title\": \"No. of downloads (daily)\"}, \"plot_bgcolor\": \"rgba(250, 250, 250, 1)\", \"title\": \"Package Downloads Comparison (Daily)\", \"shapes\": [{\"xref\": \"x\", \"yref\": \"y\", \"y1\": \"2000\", \"y0\": \"2000\", \"x0\": \"45\", \"x1\": \"120\", \"type\": \"line\"}], \"xaxis\": {\"type\": \"category\", \"showgrid\": false}, \"annotations\": [{\"xref\": \"x\", \"yref\": \"y\", \"text\": \"PyPI's stats collection service was down from March 6 to May 21\", \"y\": 2400, \"x\": 75, \"showarrow\": false}, {\"xref\": \"x\", \"yref\": \"y\", \"text\": \"From Jan 22, 2016 To Aug 29, 2016\", \"y\": 9600, \"x\": 115, \"showarrow\": false}, {\"xref\": \"x\", \"yref\": \"y\", \"text\": \"\", \"y\": 2000, \"x\": 121, \"ay\": 0, \"ax\": -5, \"showarrow\": true}, {\"xref\": \"x\", \"yref\": \"y\", \"text\": \"\", \"y\": 2000, \"x\": 45, \"ay\": 0, \"ax\": 5, \"showarrow\": true}]}, {\"linkText\": \"Export to plot.ly\", \"showLink\": true})});</script>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "trace1 = go.Scatter(\n",
    "    x=plotly_df['day'],\n",
    "    y=plotly_df['total_downloads'],\n",
    "    name='Plotly',\n",
    "    mode='lines',\n",
    "    line=dict(width=0.5,\n",
    "              color='rgb(10. 240, 10)'),\n",
    "    fill='tonexty'\n",
    ")\n",
    "\n",
    "trace2 = go.Scatter(\n",
    "    x=bokeh_df['day'],\n",
    "    y=bokeh_df['total_downloads'],\n",
    "    name='Bokeh',\n",
    "    mode='lines',\n",
    "    line=dict(width=0.5,\n",
    "              color='rgb(42, 77, 20)'),\n",
    "    fill='tonexty'\n",
    ")\n",
    "\n",
    "trace3 = go.Scatter(\n",
    "    x=mpld3_df['day'],\n",
    "    y=mpld3_df['total_downloads'],\n",
    "    name='MPLD3',\n",
    "    mode='lines',\n",
    "    line=dict(width=0.5,\n",
    "              color='rgb(20, 33, 61)'),\n",
    "    fill='tonexty'\n",
    ")\n",
    "\n",
    "trace4 = go.Scatter(\n",
    "    x=vincent_df['day'],\n",
    "    y=vincent_df['total_downloads'],\n",
    "    name='Vincent',\n",
    "    mode='lines',\n",
    "    line=dict(width=0.5,\n",
    "              color='rgb(0, 0, 0)'),\n",
    "    fill='tonexty'\n",
    ")\n",
    "\n",
    "data = [trace1, trace2, trace3, trace4]\n",
    "\n",
    "layout = go.Layout(\n",
    "    title='Package Downloads Comparison (Daily)',\n",
    "    showlegend=True,\n",
    "    xaxis=dict(\n",
    "        type='category',\n",
    "        showgrid=False\n",
    "    ),\n",
    "    yaxis=dict(\n",
    "        title='No. of downloads (daily)',\n",
    "        type='linear',\n",
    "        range=[1, 10000]\n",
    "    ),\n",
    "    plot_bgcolor='rgba(250, 250, 250, 1)',\n",
    "    shapes=[\n",
    "        dict(\n",
    "            type='line',\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            x0='45',\n",
    "            y0='2000',\n",
    "            x1='120',\n",
    "            y1='2000'\n",
    "        )\n",
    "    ],\n",
    "    annotations=[\n",
    "        dict(\n",
    "            x=75,\n",
    "            y=2400,\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            text=\"PyPI's stats collection service was down from March 6 to May 21\",\n",
    "            showarrow=False\n",
    "        ),\n",
    "        dict(\n",
    "            x=115,\n",
    "            y=9600,\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            text='From Jan 22, 2016 To Aug 29, 2016',\n",
    "            showarrow=False\n",
    "        ),\n",
    "        dict(\n",
    "            x=121,\n",
    "            y=2000,\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            text=\"\",\n",
    "            showarrow=True,\n",
    "            ay=0,\n",
    "            ax=-5\n",
    "        ),\n",
    "        dict(\n",
    "            x=45,\n",
    "            y=2000,\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            text=\"\",\n",
    "            showarrow=True,\n",
    "            ay=0,\n",
    "            ax=5\n",
    "        )\n",
    "    ]\n",
    ")\n",
    "\n",
    "fig = go.Figure(data=data, layout=layout)\n",
    "iplot(fig)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Package Downloads Comparison (Monthly)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "The dataset was created on Jan 22, 2016, so the data spans January through August 2016. We will use these months on the x-axis."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 129,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "months = ['Jan', 'Feb', 'Mar', 'Apr', 'May', 'Jun', 'Jul', 'Aug']"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "We use pandas' `groupby` method to group the rows by their `month` value and then sum their counts to find the total downloads in each month."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 130,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>total_downloads</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>month</th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>6791</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>25920</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>6008</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>15946</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>52043</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>61338</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>92813</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       total_downloads\n",
       "month                 \n",
       "1                 6791\n",
       "2                25920\n",
       "3                 6008\n",
       "4                    0\n",
       "5                15946\n",
       "6                52043\n",
       "7                61338\n",
       "8                92813"
      ]
     },
     "execution_count": 130,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "plotly_df.groupby('month').sum()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 131,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "trace1 = go.Bar(x=months, y=plotly_df.groupby('month').sum()['total_downloads'], name='Plotly')\n",
    "trace2 = go.Bar(x=months, y=vincent_df.groupby('month').sum()['total_downloads'], name='Vincent')\n",
    "trace3 = go.Bar(x=months, y=bokeh_df.groupby('month').sum()['total_downloads'], name='Bokeh')\n",
    "trace4 = go.Bar(x=months, y=mpld3_df.groupby('month').sum()['total_downloads'], name='MPLD3')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 132,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div id=\"c0b84d8b-927f-4901-84d6-0111360909bf\" style=\"height: 525px; width: 100%;\" class=\"plotly-graph-div\"></div><script type=\"text/javascript\">require([\"plotly\"], function(Plotly) { window.PLOTLYENV=window.PLOTLYENV || {};window.PLOTLYENV.BASE_URL=\"https://plot.ly\";Plotly.newPlot(\"c0b84d8b-927f-4901-84d6-0111360909bf\", [{\"y\": [6791, 25920, 6008, 0, 15946, 52043, 61338, 92813], \"x\": [\"Jan\", \"Feb\", \"Mar\", \"Apr\", \"May\", \"Jun\", \"Jul\", \"Aug\"], \"type\": \"bar\", \"name\": \"Plotly\"}, {\"y\": [609, 2010, 470, 0, 1159, 3497, 3748, 3984], \"x\": [\"Jan\", \"Feb\", \"Mar\", \"Apr\", \"May\", \"Jun\", \"Jul\", \"Aug\"], \"type\": \"bar\", \"name\": \"Vincent\"}, {\"y\": [3459, 11734, 2314, 0, 5415, 20548, 20312, 19889], \"x\": [\"Jan\", \"Feb\", \"Mar\", \"Apr\", \"May\", \"Jun\", \"Jul\", \"Aug\"], \"type\": \"bar\", \"name\": \"Bokeh\"}, {\"y\": [915, 3014, 628, 0, 1246, 3823, 5344, 5323], \"x\": [\"Jan\", \"Feb\", \"Mar\", \"Apr\", \"May\", \"Jun\", \"Jul\", \"Aug\"], \"type\": \"bar\", \"name\": \"MPLD3\"}], {\"barmode\": \"group\", \"title\": \"Package Downloads Comparison (PyPI)\", \"annotations\": [{\"xref\": \"x\", \"arrowhead\": 2, \"yref\": \"y\", \"text\": \"PyPI's stats collection service<br>was down from March 6 to May 21\", \"y\": 0, \"x\": 3, \"ay\": -150, \"ax\": 0, \"showarrow\": true}, {\"xref\": \"x\", \"yref\": \"y\", \"text\": \"From Jan 22, 2016 To Aug 29, 2016\", \"y\": 90000, \"x\": 3.7, \"showarrow\": false}], \"xaxis\": {\"title\": \"Month\"}, \"yaxis\": {\"title\": \"No. of downloads (monthly)\"}}, {\"linkText\": \"Export to plot.ly\", \"showLink\": true})});</script>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "data = [trace1, trace2, trace3, trace4]\n",
    "\n",
    "layout = go.Layout(\n",
    "    barmode='group',\n",
    "    title=\"Package Downloads Comparison (PyPI)\",\n",
    "    yaxis=dict(\n",
    "        title='No. of downloads (monthly)'\n",
    "    ),\n",
    "    xaxis=dict(\n",
    "        title='Month'\n",
    "    ),\n",
    "    annotations=[\n",
    "        dict(\n",
    "            x=3,\n",
    "            y=0,\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            text=\"PyPI's stats collection service<br>was down from March 6 to May 21\",\n",
    "            showarrow=True,\n",
    "            arrowhead=2,\n",
    "            ax=0,\n",
    "            ay=-150\n",
    "        ),\n",
    "        dict(\n",
    "            x=3.7,\n",
    "            y=90000,\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            text='From Jan 22, 2016 To Aug 29, 2016',\n",
    "            showarrow=False\n",
    "        )\n",
    "    ]\n",
    ")\n",
    "fig = go.Figure(data=data, layout=layout)\n",
    "iplot(fig)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "collapsed": true
   },
   "source": [
    "### Growth of Plotly package downloads"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Following the tutorial [Linear fit in Python](https://plot.ly/python/linear-fits/), we will try to find an\n",
    "approximate regression line for the scatter graph of Plotly package's downloads."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 155,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "xvals = np.arange(0, len(plotly_df))"
   ]
  },
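  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "The following traces show Plotly's daily downloads as a scatter plot (split into two traces to skip the days when PyPI's stats collection service was down), together with the fitted regression line."
   ]
  },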
  {
   "cell_type": "code",
   "execution_count": 207,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div id=\"933dc426-7d28-420a-9cd1-42ba2b3b0827\" style=\"height: 525px; width: 100%;\" class=\"plotly-graph-div\"></div><script type=\"text/javascript\">require([\"plotly\"], function(Plotly) { window.PLOTLYENV=window.PLOTLYENV || {};window.PLOTLYENV.BASE_URL=\"https://plot.ly\";Plotly.newPlot(\"933dc426-7d28-420a-9cd1-42ba2b3b0827\", [{\"name\": \"Plotly Downloads\", \"marker\": {\"color\": \"rgb(255, 127, 14)\", \"symbol\": \"x\", \"size\": 5}, \"mode\": \"markers\", \"y\": [801, 334, 480, 762, 817, 1373, 653, 718, 489, 364, 900, 830, 750, 1014, 1151, 472, 556, 689, 1124, 738, 983, 880, 513, 392, 632, 950, 1092, 980, 1308, 627, 484, 880, 1433, 1207, 1643, 1014, 901, 782, 995, 1478, 1225, 1099, 1110, 1096], \"x\": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43], \"type\": \"scatter\"}, {\"showlegend\": false, \"name\": \"Plotly Downloads\", \"marker\": {\"color\": \"rgb(255, 127, 14)\", \"symbol\": \"x\", \"size\": 5}, \"mode\": \"markers\", \"y\": [1054, 1738, 1622, 1814, 2226, 2172, 1189, 866, 1623, 1642, 2464, 2361, 2000, 1645, 1002, 2013, 2416, 1972, 1546, 2812, 874, 726, 2204, 2525, 1613, 1500, 1832, 934, 711, 1944, 1724, 1851, 2628, 1790, 1001, 1075, 1504, 1542, 1619, 2215, 1615, 1154, 787, 1111, 1359, 2244, 2006, 2260, 1895, 1092, 2300, 2432, 2378, 3063, 2521, 1546, 1195, 2368, 2673, 2458, 3163, 2499, 1095, 814, 2182, 2655, 2515, 3089, 2869, 969, 1031, 2110, 2851, 2759, 2871, 3139, 1331, 1236, 2936, 3010, 3667, 2534, 3227, 1271, 1101, 2517, 2575, 4068, 3102, 2826, 2195, 1224, 2708, 3134, 2556, 3085, 9340, 8579, 8098, 2763], \"x\": [121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 
182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220], \"type\": \"scatter\"}, {\"name\": \"Plotly Regression Line\", \"marker\": {\"color\": \"rgb(10, 20, 30)\"}, \"mode\": \"lines\", \"y\": [-282.5564387917327, -269.25722147486835, -255.95800415800397, -242.6587868411396, -229.35956952427523, -216.06035220741086, -202.76113489054646, -189.4619175736821, -176.16270025681771, -162.86348293995334, -149.56426562308897, -136.2650483062246, -122.9658309893602, -109.66661367249583, -96.36739635563146, -83.06817903876708, -69.76896172190271, -56.46974440503834, -43.17052708817397, -29.871309771309598, -16.572092454445226, -3.2728751375808542, 10.026342179283517, 23.32555949614789, 36.62477681301232, 49.92399412987669, 63.22321144674106, 76.52242876360543, 89.8216460804698, 103.12086339733418, 116.42008071419855, 129.71929803106292, 143.0185153479273, 156.31773266479166, 169.61694998165603, 182.9161672985204, 196.21538461538478, 209.51460193224915, 222.81381924911352, 236.11303656597795, 249.41225388284226, 262.7114711997067, 276.010688516571, 289.30990583343544, 302.60912315029975, 315.9083404671642, 329.2075577840285, 342.5067751008929, 355.80599241775735, 369.10520973462167, 382.4044270514861, 395.7036443683504, 409.00286168521484, 422.30207900207915, 435.6012963189436, 448.9005136358079, 462.1997309526723, 475.49894826953664, 488.79816558640107, 502.0973829032654, 515.3966002201298, 528.6958175369941, 541.9950348538586, 555.2942521707229, 568.5934694875873, 581.8926868044517, 595.191904121316, 608.4911214381805, 621.7903387550448, 635.0895560719092, 648.3887733887735, 661.687990705638, 674.9872080225023, 688.2864253393667, 701.585642656231, 714.8848599730954, 728.1840772899598, 741.4832946068241, 754.7825119236886, 768.0817292405529, 781.3809465574172, 794.6801638742818, 807.9793811911461, 821.2785985080104, 834.5778158248747, 
847.8770331417393, 861.1762504586036, 874.4754677754679, 887.7746850923322, 901.0739024091968, 914.3731197260611, 927.6723370429254, 940.9715543597897, 954.2707716766542, 967.5699889935186, 980.8692063103829, 994.1684236272474, 1007.4676409441117, 1020.766858260976, 1034.0660755778404, 1047.365292894705, 1060.6645102115692, 1073.9637275284335, 1087.2629448452979, 1100.5621621621624, 1113.8613794790267, 1127.160596795891, 1140.4598141127553, 1153.7590314296199, 1167.0582487464842, 1180.3574660633485, 1193.6566833802128, 1206.9559006970774, 1220.2551180139417, 1233.554335330806, 1246.8535526476705, 1260.1527699645349, 1273.4519872813992, 1286.7512045982635, 1300.050421915128, 1313.3496392319923, 1326.6488565488567, 1339.948073865721, 1353.2472911825855, 1366.5465084994498, 1379.8457258163141, 1393.1449431331785, 1406.444160450043, 1419.7433777669073, 1433.0425950837716, 1446.3418124006362, 1459.6410297175005, 1472.9402470343648, 1486.2394643512291, 1499.5386816680937, 1512.837898984958, 1526.1371163018223, 1539.4363336186866, 1552.7355509355511, 1566.0347682524155, 1579.3339855692798, 1592.633202886144, 1605.9324202030086, 1619.231637519873, 1632.5308548367373, 1645.8300721536018, 1659.1292894704661, 1672.4285067873304, 1685.7277241041947, 1699.0269414210593, 1712.3261587379236, 1725.625376054788, 1738.9245933716522, 1752.2238106885168, 1765.5230280053809, 1778.8222453222454, 1792.12146263911, 1805.420679955974, 1818.7198972728386, 1832.0191145897031, 1845.3183319065672, 1858.6175492234318, 1871.9167665402963, 1885.2159838571604, 1898.515201174025, 1911.814418490889, 1925.1136358077536, 1938.412853124618, 1951.7120704414822, 1965.0112877583467, 1978.3105050752113, 1991.6097223920754, 2004.90893970894, 2018.208157025804, 2031.5073743426685, 2044.806591659533, 2058.1058089763974, 2071.4050262932615, 2084.7042436101265, 2098.0034609269906, 2111.3026782438546, 2124.6018955607196, 2137.9011128775837, 2151.200330194448, 2164.499547511312, 2177.798764828177, 
2191.097982145041, 2204.397199461905, 2217.69641677877, 2230.995634095634, 2244.2948514124982, 2257.5940687293632, 2270.8932860462273, 2284.1925033630914, 2297.4917206799564, 2310.7909379968205, 2324.0901553136846, 2337.3893726305496, 2350.6885899474137, 2363.9878072642778, 2377.2870245811428, 2390.586241898007, 2403.885459214871, 2417.184676531735, 2430.4838938486, 2443.783111165464, 2457.082328482328, 2470.381545799193, 2483.6807631160573, 2496.9799804329214, 2510.2791977497864, 2523.5784150666505, 2536.8776323835145, 2550.1768497003795, 2563.4760670172436, 2576.7752843341077, 2590.0745016509727, 2603.373718967837, 2616.672936284701, 2629.972153601566, 2643.27137091843], \"x\": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220], \"line\": {\"dash\": \"longdashdot\", \"width\": 1, \"color\": \"rgba(10, 10, 10, 1)\"}, \"type\": \"scatter\"}], {\"title\": \"Linear Regression Line for Plotly's Package Downloads Growth\", \"annotations\": [{\"xref\": \"x\", \"yref\": \"y\", \"text\": \"<b>Y = 13.29X - 282.55</b>\", \"y\": 2000, \"x\": 85, 
\"showarrow\": false}], \"xaxis\": {\"title\": \"# days\"}, \"yaxis\": {\"title\": \"No. of downloads (daily)\"}}, {\"linkText\": \"Export to plot.ly\", \"showLink\": true})});</script>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "trace1 = go.Scatter(\n",
    "    x=xvals[:44], \n",
    "    y=plotly_df['total_downloads'].iloc[:44], \n",
    "    mode='markers',\n",
    "    marker=go.Marker(color='rgb(255, 127, 14)',size=5,symbol='x'),\n",
    "    name='Plotly Downloads'\n",
    ")\n",
    "\n",
    "trace2 = go.Scatter(\n",
    "    x=xvals[121:], \n",
    "    y=plotly_df['total_downloads'].iloc[121:],\n",
    "    mode='markers',\n",
    "    marker=go.Marker(color='rgb(255, 127, 14)',size=5,symbol='x'),\n",
    "    name='Plotly Downloads',\n",
    "    showlegend=False\n",
    ")\n",
    "\n",
    "# linear regression line for Plotly package downloads\n",
    "pslope, pintercept, pr_value, pp_value, pstd_err = linregress(xvals, plotly_df['total_downloads'])\n",
    "plotly_line = pslope*xvals + pintercept\n",
    "\n",
    "trace3 = go.Scatter(\n",
    "    x=xvals, \n",
    "    y=plotly_line, \n",
    "    mode='lines',\n",
    "    marker=go.Marker(color='rgb(10, 20, 30)'),\n",
    "    name='Plotly Regression Line',\n",
    "    line=dict(\n",
    "        color='rgba(10, 10, 10, 1)',\n",
    "        width=1,\n",
    "        dash='longdashdot'\n",
    "    )\n",
    ")\n",
    "\n",
    "layout = go.Layout(\n",
    "    title='Linear Regression Line for Plotly\\'s Package Downloads Growth',\n",
    "    yaxis = dict(\n",
    "        title='No. of downloads (daily)'\n",
    "    ),\n",
    "    xaxis = dict(\n",
    "        title='# days'\n",
    "    ),\n",
    "    annotations=[\n",
    "        dict(\n",
    "            x=85,\n",
    "            y=2000,\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            text=\"<b>Y = 13.29X - 282.55</b>\",\n",
    "            showarrow=False\n",
    "        )\n",
    "    ]\n",
    ")\n",
    "\n",
    "data = [trace1, trace2, trace3]\n",
    "\n",
    "fig = go.Figure(data=data, layout=layout)\n",
    "iplot(fig)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Similarly, we can find the approximate growth line for 'Matplotlib'."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 204,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "mslope, mintercept, mr_value, mp_value, mstd_err = linregress(xvals, matplotlib_df['total_downloads'])\n",
    "matplotlib_line = mslope*xvals + mintercept"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Daily download counts for 'Matplotlib' range around 7000-8000 as of now."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Let's find out how much time it will take for Plotly to reach that level."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Using Plotly's growth line equation $Y = 13.29X - 282.55$, we can find out the approximate number of days for downloads to reach 8000."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Setting $Y = 8000$ results in X = 624 (nearest integer value), where the current day index is 220 as of Aug 29, 2016.\n",
    "\n",
    "#### That means it will take around 404 days for Plotly's daily downloads to reach 8000."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 229,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div id=\"69fb0e37-01d9-4441-b1cb-cd6e66a42212\" style=\"height: 525px; width: 100%;\" class=\"plotly-graph-div\"></div><script type=\"text/javascript\">require([\"plotly\"], function(Plotly) { window.PLOTLYENV=window.PLOTLYENV || {};window.PLOTLYENV.BASE_URL=\"https://plot.ly\";Plotly.newPlot(\"69fb0e37-01d9-4441-b1cb-cd6e66a42212\", [{\"name\": \"Plotly Regression (Actual)\", \"marker\": {\"color\": \"rgb(10, 20, 30)\"}, \"mode\": \"lines\", \"y\": [-282.5564387917327, -269.25722147486835, -255.95800415800397, -242.6587868411396, -229.35956952427523, -216.06035220741086, -202.76113489054646, -189.4619175736821, -176.16270025681771, -162.86348293995334, -149.56426562308897, -136.2650483062246, -122.9658309893602, -109.66661367249583, -96.36739635563146, -83.06817903876708, -69.76896172190271, -56.46974440503834, -43.17052708817397, -29.871309771309598, -16.572092454445226, -3.2728751375808542, 10.026342179283517, 23.32555949614789, 36.62477681301232, 49.92399412987669, 63.22321144674106, 76.52242876360543, 89.8216460804698, 103.12086339733418, 116.42008071419855, 129.71929803106292, 143.0185153479273, 156.31773266479166, 169.61694998165603, 182.9161672985204, 196.21538461538478, 209.51460193224915, 222.81381924911352, 236.11303656597795, 249.41225388284226, 262.7114711997067, 276.010688516571, 289.30990583343544, 302.60912315029975, 315.9083404671642, 329.2075577840285, 342.5067751008929, 355.80599241775735, 369.10520973462167, 382.4044270514861, 395.7036443683504, 409.00286168521484, 422.30207900207915, 435.6012963189436, 448.9005136358079, 462.1997309526723, 475.49894826953664, 488.79816558640107, 502.0973829032654, 515.3966002201298, 528.6958175369941, 541.9950348538586, 555.2942521707229, 568.5934694875873, 581.8926868044517, 595.191904121316, 608.4911214381805, 621.7903387550448, 635.0895560719092, 648.3887733887735, 661.687990705638, 674.9872080225023, 688.2864253393667, 701.585642656231, 714.8848599730954, 728.1840772899598, 741.4832946068241, 
754.7825119236886, 768.0817292405529, 781.3809465574172, 794.6801638742818, 807.9793811911461, 821.2785985080104, 834.5778158248747, 847.8770331417393, 861.1762504586036, 874.4754677754679, 887.7746850923322, 901.0739024091968, 914.3731197260611, 927.6723370429254, 940.9715543597897, 954.2707716766542, 967.5699889935186, 980.8692063103829, 994.1684236272474, 1007.4676409441117, 1020.766858260976, 1034.0660755778404, 1047.365292894705, 1060.6645102115692, 1073.9637275284335, 1087.2629448452979, 1100.5621621621624, 1113.8613794790267, 1127.160596795891, 1140.4598141127553, 1153.7590314296199, 1167.0582487464842, 1180.3574660633485, 1193.6566833802128, 1206.9559006970774, 1220.2551180139417, 1233.554335330806, 1246.8535526476705, 1260.1527699645349, 1273.4519872813992, 1286.7512045982635, 1300.050421915128, 1313.3496392319923, 1326.6488565488567, 1339.948073865721, 1353.2472911825855, 1366.5465084994498, 1379.8457258163141, 1393.1449431331785, 1406.444160450043, 1419.7433777669073, 1433.0425950837716, 1446.3418124006362, 1459.6410297175005, 1472.9402470343648, 1486.2394643512291, 1499.5386816680937, 1512.837898984958, 1526.1371163018223, 1539.4363336186866, 1552.7355509355511, 1566.0347682524155, 1579.3339855692798, 1592.633202886144, 1605.9324202030086, 1619.231637519873, 1632.5308548367373, 1645.8300721536018, 1659.1292894704661, 1672.4285067873304, 1685.7277241041947, 1699.0269414210593, 1712.3261587379236, 1725.625376054788, 1738.9245933716522, 1752.2238106885168, 1765.5230280053809, 1778.8222453222454, 1792.12146263911, 1805.420679955974, 1818.7198972728386, 1832.0191145897031, 1845.3183319065672, 1858.6175492234318, 1871.9167665402963, 1885.2159838571604, 1898.515201174025, 1911.814418490889, 1925.1136358077536, 1938.412853124618, 1951.7120704414822, 1965.0112877583467, 1978.3105050752113, 1991.6097223920754, 2004.90893970894, 2018.208157025804, 2031.5073743426685, 2044.806591659533, 2058.1058089763974, 2071.4050262932615, 2084.7042436101265, 2098.0034609269906, 
2111.3026782438546, 2124.6018955607196, 2137.9011128775837, 2151.200330194448, 2164.499547511312, 2177.798764828177, 2191.097982145041, 2204.397199461905, 2217.69641677877, 2230.995634095634, 2244.2948514124982, 2257.5940687293632, 2270.8932860462273, 2284.1925033630914, 2297.4917206799564, 2310.7909379968205, 2324.0901553136846, 2337.3893726305496, 2350.6885899474137, 2363.9878072642778, 2377.2870245811428, 2390.586241898007, 2403.885459214871, 2417.184676531735, 2430.4838938486, 2443.783111165464, 2457.082328482328, 2470.381545799193, 2483.6807631160573, 2496.9799804329214, 2510.2791977497864, 2523.5784150666505, 2536.8776323835145, 2550.1768497003795, 2563.4760670172436, 2576.7752843341077, 2590.0745016509727, 2603.373718967837, 2616.672936284701, 2629.972153601566, 2643.27137091843], \"x\": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220], \"line\": {\"dash\": \"longdashdot\", \"width\": 1, \"color\": \"rgba(10, 10, 10, 1)\"}, \"type\": \"scatter\"}, {\"name\": \"Plotly Regression (Prediction)\", \"marker\": {\"color\": \"rgb(10, 
20, 30)\"}, \"mode\": \"lines\", \"y\": [2656.570588235294, 2669.869805552158, 2683.169022869023, 2696.468240185887, 2709.7674575027513, 2723.0666748196163, 2736.3658921364804, 2749.6651094533445, 2762.9643267702095, 2776.2635440870736, 2789.5627614039377, 2802.8619787208027, 2816.1611960376667, 2829.460413354531, 2842.759630671396, 2856.05884798826, 2869.358065305124, 2882.657282621989, 2895.956499938853, 2909.255717255717, 2922.554934572582, 2935.8541518894463, 2949.1533692063103, 2962.4525865231744, 2975.7518038400394, 2989.0510211569035, 3002.3502384737676, 3015.6494557906326, 3028.9486731074967, 3042.247890424361, 3055.547107741226, 3068.84632505809, 3082.145542374954, 3095.444759691819, 3108.743977008683, 3122.043194325547, 3135.342411642412, 3148.641628959276, 3161.9408462761403, 3175.2400635930053, 3188.5392809098694, 3201.8384982267335, 3215.1377155435976, 3228.4369328604625, 3241.7361501773266, 3255.0353674941907, 3268.3345848110557, 3281.63380212792, 3294.933019444784, 3308.232236761649, 3321.531454078513, 3334.830671395377, 3348.129888712242, 3361.429106029106, 3374.7283233459702, 3388.0275406628352, 3401.3267579796993, 3414.6259752965634, 3427.9251926134284, 3441.2244099302925, 3454.5236272471566, 3467.8228445640207, 3481.1220618808857, 3494.4212791977498, 3507.720496514614, 3521.019713831479, 3534.318931148343, 3547.618148465207, 3560.917365782072, 3574.216583098936, 3587.5158004158, 3600.815017732665, 3614.1142350495293, 3627.4134523663934, 3640.7126696832584, 3654.0118870001224, 3667.3111043169865, 3680.6103216338515, 3693.9095389507156, 3707.2087562675797, 3720.507973584444, 3733.807190901309, 3747.106408218173, 3760.405625535037, 3773.704842851902, 3787.004060168766, 3800.30327748563, 3813.602494802494, 3826.901712119359, 3840.2009294362233, 3853.5001467530874, 3866.7993640699524, 3880.0985813868165, 3893.3977987036806, 3906.6970160205456, 3919.9962333374096, 3933.2954506542737, 3946.5946679711387, 3959.893885288003, 3973.193102604867, 
3986.492319921732, 3999.791537238596, 4013.09075455546, 4026.389971872325, 4039.689189189189, 4052.9884065060533, 4066.2876238229173, 4079.5868411397823, 4092.8860584566464, 4106.1852757735105, 4119.4844930903755, 4132.78371040724, 4146.082927724104, 4159.382145040969, 4172.681362357833, 4185.980579674697, 4199.279796991562, 4212.579014308426, 4225.87823162529, 4239.177448942155, 4252.476666259019, 4265.775883575883, 4279.075100892748, 4292.374318209612, 4305.673535526476, 4318.9727528433405, 4332.2719701602055, 4345.5711874770695, 4358.870404793934, 4372.169622110799, 4385.468839427663, 4398.768056744527, 4412.067274061392, 4425.366491378256, 4438.66570869512, 4451.964926011985, 4465.264143328849, 4478.563360645713, 4491.862577962578, 4505.161795279442, 4518.461012596306, 4531.760229913171, 4545.059447230035, 4558.3586645468995, 4571.657881863764, 4584.957099180629, 4598.256316497493, 4611.555533814357, 4624.854751131222, 4638.153968448086, 4651.45318576495, 4664.752403081815, 4678.051620398679, 4691.350837715543, 4704.650055032408, 4717.949272349272, 4731.248489666136, 4744.547706983001, 4757.846924299865, 4771.146141616729, 4784.445358933594, 4797.7445762504585, 4811.043793567323, 4824.343010884188, 4837.642228201052, 4850.941445517916, 4864.24066283478, 4877.539880151645, 4890.839097468509, 4904.138314785373, 4917.437532102238, 4930.736749419102, 4944.035966735966, 4957.335184052831, 4970.634401369695, 4983.933618686559, 4997.232836003424, 5010.5320533202885, 5023.831270637153, 5037.130487954018, 5050.429705270882, 5063.728922587746, 5077.028139904611, 5090.327357221475, 5103.626574538339, 5116.925791855203, 5130.225009172068, 5143.524226488932, 5156.823443805796, 5170.122661122661, 5183.421878439525, 5196.721095756389, 5210.020313073254, 5223.319530390118, 5236.6187477069825, 5249.9179650238475, 5263.217182340712, 5276.516399657576, 5289.815616974441, 5303.114834291305, 5316.414051608169, 5329.713268925034, 5343.012486241898, 5356.311703558762, 
5369.610920875626, 5382.910138192491, 5396.209355509355, 5409.508572826219, 5422.807790143084, 5436.107007459948, 5449.406224776812, 5462.705442093677, 5476.0046594105415, 5489.303876727406, 5502.603094044271, 5515.902311361135, 5529.201528677999, 5542.500745994864, 5555.799963311728, 5569.099180628592, 5582.398397945457, 5595.697615262321, 5608.996832579185, 5622.296049896049, 5635.595267212914, 5648.894484529778, 5662.193701846642, 5675.492919163507, 5688.7921364803715, 5702.091353797236, 5715.390571114101, 5728.689788430965, 5741.989005747829, 5755.288223064694, 5768.587440381558, 5781.886657698422, 5795.185875015287, 5808.485092332151, 5821.784309649015, 5835.08352696588, 5848.382744282744, 5861.681961599608, 5874.981178916472, 5888.280396233337, 5901.579613550201, 5914.8788308670655, 5928.1780481839305, 5941.477265500795, 5954.776482817659, 5968.075700134524, 5981.374917451388, 5994.674134768252, 6007.973352085117, 6021.272569401981, 6034.571786718845, 6047.87100403571, 6061.170221352574, 6074.469438669438, 6087.768655986303, 6101.067873303167, 6114.367090620031, 6127.666307936896, 6140.9655252537605, 6154.264742570625, 6167.563959887489, 6180.863177204354, 6194.162394521218, 6207.461611838082, 6220.760829154947, 6234.060046471811, 6247.359263788675, 6260.65848110554, 6273.957698422404, 6287.256915739268, 6300.556133056133, 6313.855350372997, 6327.154567689861, 6340.453785006726, 6353.75300232359, 6367.0522196404545, 6380.3514369573195, 6393.650654274184, 6406.949871591048, 6420.249088907912, 6433.548306224777, 6446.847523541641, 6460.146740858505, 6473.44595817537, 6486.745175492234, 6500.044392809098, 6513.343610125963, 6526.642827442827, 6539.942044759691, 6553.241262076556, 6566.54047939342, 6579.839696710284, 6593.138914027149, 6606.4381313440135, 6619.737348660878, 6633.036565977743, 6646.335783294607, 6659.635000611471, 6672.934217928335, 6686.2334352452, 6699.532652562064, 6712.831869878928, 6726.131087195793, 6739.430304512657, 6752.729521829521, 
6766.028739146386, 6779.32795646325, 6792.627173780114, 6805.926391096979, 6819.2256084138435, 6832.524825730708, 6845.824043047573, 6859.123260364437, 6872.422477681301, 6885.721694998166, 6899.02091231503, 6912.320129631894, 6925.619346948758, 6938.918564265623, 6952.217781582487, 6965.516998899351, 6978.816216216216, 6992.11543353308, 7005.414650849944, 7018.713868166809, 7032.013085483673, 7045.3123028005375, 7058.6115201174025, 7071.910737434267, 7085.209954751131, 7098.509172067996, 7111.80838938486, 7125.107606701724, 7138.406824018589, 7151.706041335453, 7165.005258652317, 7178.304475969182, 7191.603693286046, 7204.90291060291, 7218.202127919774, 7231.501345236639, 7244.800562553503, 7258.0997798703675, 7271.398997187232, 7284.6982145040965, 7297.997431820961, 7311.296649137826, 7324.59586645469, 7337.895083771554, 7351.194301088419, 7364.493518405283, 7377.792735722147, 7391.091953039012, 7404.391170355876, 7417.69038767274, 7430.989604989605, 7444.288822306469, 7457.588039623333, 7470.887256940197, 7484.186474257062, 7497.4856915739265, 7510.784908890791, 7524.084126207656, 7537.38334352452, 7550.682560841384, 7563.981778158249, 7577.280995475113, 7590.580212791977, 7603.879430108842, 7617.178647425706, 7630.47786474257, 7643.777082059435, 7657.076299376299, 7670.375516693163, 7683.674734010028, 7696.973951326892, 7710.273168643756, 7723.5723859606205, 7736.8716032774855, 7750.17082059435, 7763.470037911214, 7776.769255228079, 7790.068472544943, 7803.367689861807, 7816.666907178672, 7829.966124495536, 7843.2653418124, 7856.564559129265, 7869.863776446129, 7883.162993762993, 7896.462211079858, 7909.761428396721, 7923.060645713587, 7936.359863030451, 7949.6590803473155, 7962.95829766418, 7976.257514981044, 7989.556732297908, 8002.855949614774, 8016.155166931638], \"x\": [221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 
259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300, 301, 302, 303, 304, 305, 306, 307, 308, 309, 310, 311, 312, 313, 314, 315, 316, 317, 318, 319, 320, 321, 322, 323, 324, 325, 326, 327, 328, 329, 330, 331, 332, 333, 334, 335, 336, 337, 338, 339, 340, 341, 342, 343, 344, 345, 346, 347, 348, 349, 350, 351, 352, 353, 354, 355, 356, 357, 358, 359, 360, 361, 362, 363, 364, 365, 366, 367, 368, 369, 370, 371, 372, 373, 374, 375, 376, 377, 378, 379, 380, 381, 382, 383, 384, 385, 386, 387, 388, 389, 390, 391, 392, 393, 394, 395, 396, 397, 398, 399, 400, 401, 402, 403, 404, 405, 406, 407, 408, 409, 410, 411, 412, 413, 414, 415, 416, 417, 418, 419, 420, 421, 422, 423, 424, 425, 426, 427, 428, 429, 430, 431, 432, 433, 434, 435, 436, 437, 438, 439, 440, 441, 442, 443, 444, 445, 446, 447, 448, 449, 450, 451, 452, 453, 454, 455, 456, 457, 458, 459, 460, 461, 462, 463, 464, 465, 466, 467, 468, 469, 470, 471, 472, 473, 474, 475, 476, 477, 478, 479, 480, 481, 482, 483, 484, 485, 486, 487, 488, 489, 490, 491, 492, 493, 494, 495, 496, 497, 498, 499, 500, 501, 502, 503, 504, 505, 506, 507, 508, 509, 510, 511, 512, 513, 514, 515, 516, 517, 518, 519, 520, 521, 522, 523, 524, 525, 526, 527, 528, 529, 530, 531, 532, 533, 534, 535, 536, 537, 538, 539, 540, 541, 542, 543, 544, 545, 546, 547, 548, 549, 550, 551, 552, 553, 554, 555, 556, 557, 558, 559, 560, 561, 562, 563, 564, 565, 566, 567, 568, 569, 570, 571, 572, 573, 574, 575, 576, 577, 578, 579, 580, 581, 582, 583, 584, 585, 586, 587, 588, 589, 590, 591, 592, 593, 594, 595, 596, 597, 598, 599, 600, 601, 602, 603, 604, 605, 606, 607, 608, 609, 610, 611, 612, 613, 614, 615, 616, 617, 618, 619, 620, 621, 622, 623, 624], \"line\": {\"dash\": \"dot\", \"width\": 1, \"color\": \"rgba(10, 10, 10, 1)\"}, \"type\": \"scatter\"}], {\"shapes\": [{\"xref\": \"x\", \"yref\": \"y\", \"y1\": 8000, 
\"y0\": 8000, \"line\": {\"dash\": \"solid\", \"width\": 1, \"color\": \"rgba(10, 10, 10, 1)\"}, \"x1\": 624, \"type\": \"line\", \"x0\": 0}, {\"xref\": \"x\", \"yref\": \"y\", \"y1\": 8000, \"y0\": 0, \"line\": {\"dash\": \"solid\", \"width\": 1, \"color\": \"rgba(10, 10, 10, 1)\"}, \"x1\": 624, \"type\": \"line\", \"x0\": 624}], \"title\": \"Prediction for Plotly's Package Downloads Growth\", \"annotations\": [{\"xref\": \"x\", \"yref\": \"y\", \"text\": \"<b>Y = 13.29X - 282.55</b>\", \"y\": 2000, \"x\": 85, \"showarrow\": false}, {\"xref\": \"x\", \"yref\": \"y\", \"text\": \"Current download range for Matplotlib\", \"y\": 7800, \"x\": 400, \"showarrow\": false}], \"xaxis\": {\"title\": \"# days\"}, \"yaxis\": {\"title\": \"No. of downloads (daily)\"}}, {\"linkText\": \"Export to plot.ly\", \"showLink\": true})});</script>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Least-squares line through Plotly's daily download counts.\n",
    "# `xvals` and `plotly_df` are defined in earlier cells of this notebook.\n",
    "pslope, pintercept, pr_value, pp_value, pstd_err = linregress(xvals, plotly_df['total_downloads'])\n",
    "plotly_line = pslope*xvals + pintercept\n",
    "\n",
    "# Forecast window and reference level, named once so that the prediction\n",
    "# trace, the guide lines and the annotations below cannot drift apart.\n",
    "FORECAST_START_DAY = 221\n",
    "FORECAST_DAYS = 404\n",
    "FORECAST_END_DAY = FORECAST_START_DAY + FORECAST_DAYS - 1  # 624\n",
    "MATPLOTLIB_DAILY_DOWNLOADS = 8000  # height of the Matplotlib reference line\n",
    "\n",
    "# Every line in the figure shares one colour; only the dash pattern differs.\n",
    "LINE_COLOR = 'rgba(10, 10, 10, 1)'\n",
    "guide_style = dict(color=LINE_COLOR, width=1, dash='solid')\n",
    "\n",
    "trace1 = go.Scatter(\n",
    "    x=xvals,\n",
    "    y=plotly_line,\n",
    "    mode='lines',\n",
    "    # Plain dict rather than the deprecated go.Marker wrapper; same figure JSON.\n",
    "    marker=dict(color='rgb(10, 20, 30)'),\n",
    "    name='Plotly Regression (Actual)',\n",
    "    line=dict(color=LINE_COLOR, width=1, dash='longdashdot')\n",
    ")\n",
    "\n",
    "# Extend the fitted line over the forecast window (end day inclusive).\n",
    "future_xvals = np.arange(FORECAST_START_DAY, FORECAST_END_DAY + 1)\n",
    "\n",
    "trace2 = go.Scatter(\n",
    "    x=future_xvals,\n",
    "    y=pslope*future_xvals + pintercept,\n",
    "    mode='lines',\n",
    "    marker=dict(color='rgb(10, 20, 30)'),\n",
    "    name='Plotly Regression (Prediction)',\n",
    "    line=dict(color=LINE_COLOR, width=1, dash='dot')\n",
    ")\n",
    "\n",
    "# Build the equation label from the fitted coefficients so it always matches\n",
    "# the plotted line instead of relying on hand-copied numbers.\n",
    "equation_text = '<b>Y = {:.2f}X {} {:.2f}</b>'.format(\n",
    "    pslope, '-' if pintercept < 0 else '+', abs(pintercept)\n",
    ")\n",
    "\n",
    "layout = go.Layout(\n",
    "    title='Prediction for Plotly\\'s Package Downloads Growth',\n",
    "    yaxis=dict(title='No. of downloads (daily)'),\n",
    "    xaxis=dict(title='# days'),\n",
    "    annotations=[\n",
    "        dict(\n",
    "            x=85,\n",
    "            y=2000,\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            text=equation_text,\n",
    "            showarrow=False\n",
    "        ),\n",
    "        dict(\n",
    "            x=400,\n",
    "            y=7800,  # sits just below the horizontal reference line\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            text='Current download range for Matplotlib',\n",
    "            showarrow=False\n",
    "        )\n",
    "    ],\n",
    "    shapes=[\n",
    "        # Horizontal guide at the Matplotlib reference level.\n",
    "        dict(\n",
    "            type='line',\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            x0=0,\n",
    "            y0=MATPLOTLIB_DAILY_DOWNLOADS,\n",
    "            x1=FORECAST_END_DAY,\n",
    "            y1=MATPLOTLIB_DAILY_DOWNLOADS,\n",
    "            line=guide_style\n",
    "        ),\n",
    "        # Vertical guide at the last forecast day.\n",
    "        dict(\n",
    "            type='line',\n",
    "            xref='x',\n",
    "            yref='y',\n",
    "            x0=FORECAST_END_DAY,\n",
    "            y0=0,\n",
    "            x1=FORECAST_END_DAY,\n",
    "            y1=MATPLOTLIB_DAILY_DOWNLOADS,\n",
    "            line=guide_style\n",
    "        )\n",
    "    ]\n",
    ")\n",
    "\n",
    "data = [trace1, trace2]\n",
    "\n",
    "fig = go.Figure(data=data, layout=layout)\n",
    "iplot(fig)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 2",
   "language": "python",
   "name": "python2"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 2
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython2",
   "version": "2.7.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 0
}