{ "metadata": { "name": "Untitled0" }, "nbformat": 3, "nbformat_minor": 0, "worksheets": [ { "cells": [ { "cell_type": "code", "collapsed": false, "input": "%matplotlib inline\nimport pandas as pd\ndata = pd.read_csv(\"emdata-tsv (1).csv\")\n ", "language": "python", "metadata": {}, "outputs": [], "prompt_number": 16 }, { "cell_type": "code", "collapsed": false, "input": "data.describe()\ndata.shape\ndata.Country.describe()\ndata.Type.describe()", "language": "python", "metadata": {}, "outputs": [ { "metadata": {}, "output_type": "pyout", "prompt_number": 18, "text": "count 17828\nunique 15\ntop Transport Accident\nfreq 4351\nName: Type, dtype: object" } ], "prompt_number": 18 }, { "cell_type": "code", "collapsed": false, "input": "data.describe()", "language": "python", "metadata": {}, "outputs": [ { "html": "
\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
StartEndDurationKilledCostAffectedColumn 12
count 17828.000000 17828.000000 17828.000000 13996.000000 1.108500e+04 3772.000000 0
mean 1990.883049 1990.918387 0.035338 2718.355173 5.586713e+05 488.759659NaN
std 17.851370 17.836943 0.302913 75162.832728 6.951056e+06 3384.235083NaN
min 1900.000000 1900.000000 0.000000 1.000000 1.000000e+00 0.003000NaN
25% 1986.000000 1986.000000 0.000000 12.000000 6.000000e+01 5.000000NaN
50% 1996.000000 1996.000000 0.000000 24.000000 1.000000e+03 35.000000NaN
75% 2003.000000 2003.000000 0.000000 57.000000 1.975000e+04 200.000000NaN
max 2008.000000 2009.000000 9.000000 5000000.000000 3.000000e+08 125000.000000NaN
\n

8 rows \u00d7 7 columns

\n
", "metadata": {}, "output_type": "pyout", "prompt_number": 19, "text": " Start End Duration Killed Cost \\\ncount 17828.000000 17828.000000 17828.000000 13996.000000 1.108500e+04 \nmean 1990.883049 1990.918387 0.035338 2718.355173 5.586713e+05 \nstd 17.851370 17.836943 0.302913 75162.832728 6.951056e+06 \nmin 1900.000000 1900.000000 0.000000 1.000000 1.000000e+00 \n25% 1986.000000 1986.000000 0.000000 12.000000 6.000000e+01 \n50% 1996.000000 1996.000000 0.000000 24.000000 1.000000e+03 \n75% 2003.000000 2003.000000 0.000000 57.000000 1.975000e+04 \nmax 2008.000000 2009.000000 9.000000 5000000.000000 3.000000e+08 \n\n Affected Column 12 \ncount 3772.000000 0 \nmean 488.759659 NaN \nstd 3384.235083 NaN \nmin 0.003000 NaN \n25% 5.000000 NaN \n50% 35.000000 NaN \n75% 200.000000 NaN \nmax 125000.000000 NaN \n\n[8 rows x 7 columns]" } ], "prompt_number": 19 }, { "cell_type": "code", "collapsed": false, "input": "print data.Killed.groupby(data.Type).sum().order()", "language": "python", "metadata": {}, "outputs": [ { "output_type": "stream", "stream": "stdout", "text": "Type\nWildfire 3287\nMass movement dry 4919\nIndustrial Accident 49797\nMass movement wet 55040\nMiscellaneous accident 58121\nVolcano 95979\nExtreme temperature 108938\nTransport Accident 201053\nStorm 1373104\nEarthquake (seismic activity) 2311491\nComplex Disasters 5610000\nFlood 6911040\nEpidemic 9555059\nDrought 11708271\nInsect infestation NaN\ndtype: float64\n" } ], "prompt_number": 23 } ], "metadata": {} } ] }