{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Extracting data and saving it to a new file" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "This exercise walks you through how to read CSV data, select certain data using selection rules, and save the selected data into a new file." ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "First, import the packages needed, then read the data from the file *DoubleMuRun2011.csv* and store it in the variable *dataset*. Let's also check the number of rows and look at the content of the file." ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "collapsed": true }, "outputs": [], "source": [ "import pandas as pd\n", "import matplotlib.pyplot as plt\n", "% matplotlib inline" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "The file has 475465 rows.\n" ] }, { "data": { "text/html": [ "
\n", " | Run | \n", "Event | \n", "Type1 | \n", "E1 | \n", "px1 | \n", "py1 | \n", "pz1 | \n", "pt1 | \n", "eta1 | \n", "phi1 | \n", "... | \n", "Type2 | \n", "E2 | \n", "px2 | \n", "py2 | \n", "pz2 | \n", "pt2 | \n", "eta2 | \n", "phi2 | \n", "Q2 | \n", "M | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "165617 | \n", "74601703 | \n", "G | \n", "9.69873 | \n", "-9.510430 | \n", "0.366205 | \n", "1.86329 | \n", "9.51748 | \n", "0.194546 | \n", "3.10311 | \n", "... | \n", "G | \n", "9.76332 | \n", "7.327710 | \n", "-1.152370 | \n", "6.34728 | \n", "7.41776 | \n", "0.775564 | \n", "-0.155984 | \n", "1 | \n", "17.49220 | \n", "
1 | \n", "165617 | \n", "75100943 | \n", "G | \n", "6.20385 | \n", "-4.266610 | \n", "0.456545 | \n", "-4.47930 | \n", "4.29097 | \n", "-0.912070 | \n", "3.03499 | \n", "... | \n", "G | \n", "9.66898 | \n", "7.273970 | \n", "-2.821120 | \n", "-5.71040 | \n", "7.80188 | \n", "-0.678625 | \n", "-0.369977 | \n", "1 | \n", "11.55340 | \n", "
2 | \n", "165617 | \n", "75587682 | \n", "G | \n", "19.28920 | \n", "-4.212080 | \n", "-0.651623 | \n", "18.81210 | \n", "4.26219 | \n", "2.190460 | \n", "-2.98811 | \n", "... | \n", "G | \n", "9.82439 | \n", "4.343940 | \n", "-0.473505 | \n", "8.79849 | \n", "4.36967 | \n", "1.449670 | \n", "-0.108575 | \n", "1 | \n", "9.16361 | \n", "
3 | \n", "165617 | \n", "75660978 | \n", "G | \n", "7.04268 | \n", "-6.326780 | \n", "-0.268545 | \n", "3.08025 | \n", "6.33248 | \n", "0.469033 | \n", "-3.09917 | \n", "... | \n", "G | \n", "5.58571 | \n", "4.474760 | \n", "0.848935 | \n", "-3.23185 | \n", "4.55458 | \n", "-0.660499 | \n", "0.187488 | \n", "1 | \n", "12.47740 | \n", "
4 | \n", "165617 | \n", "75947690 | \n", "G | \n", "7.27507 | \n", "0.102966 | \n", "-5.533080 | \n", "-4.72122 | \n", "5.53403 | \n", "-0.773616 | \n", "-1.55219 | \n", "... | \n", "G | \n", "7.31811 | \n", "-0.398831 | \n", "6.940810 | \n", "2.28247 | \n", "6.95226 | \n", "0.322677 | \n", "1.628190 | \n", "1 | \n", "14.31590 | \n", "
5 rows × 21 columns
\n", "\n", " | Run | \n", "Event | \n", "Type1 | \n", "E1 | \n", "px1 | \n", "py1 | \n", "pz1 | \n", "pt1 | \n", "eta1 | \n", "phi1 | \n", "... | \n", "Type2 | \n", "E2 | \n", "px2 | \n", "py2 | \n", "pz2 | \n", "pt2 | \n", "eta2 | \n", "phi2 | \n", "Q2 | \n", "M | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "165617 | \n", "74969122 | \n", "G | \n", "59.9226 | \n", "-46.15160 | \n", "29.4115 | \n", "-24.4070 | \n", "54.7266 | \n", "-0.432382 | \n", "2.574210 | \n", "... | \n", "G | \n", "52.4465 | \n", "30.10970 | \n", "-16.39890 | \n", "-39.68760 | \n", "34.2859 | \n", "-0.988511 | \n", "-0.498717 | \n", "-1 | \n", "89.9557 | \n", "
1 | \n", "165617 | \n", "75138253 | \n", "G | \n", "97.1011 | \n", "-23.61440 | \n", "6.6660 | \n", "-93.9497 | \n", "24.5372 | \n", "-2.052350 | \n", "2.866470 | \n", "... | \n", "G | \n", "30.5992 | \n", "-11.61340 | \n", "-25.98480 | \n", "11.23470 | \n", "28.4619 | \n", "0.385137 | \n", "-1.991090 | \n", "1 | \n", "88.6081 | \n", "
2 | \n", "165617 | \n", "75887636 | \n", "G | \n", "152.9720 | \n", "7.46565 | \n", "-30.7098 | \n", "-149.6710 | \n", "31.6042 | \n", "-2.259260 | \n", "-1.332320 | \n", "... | \n", "G | \n", "33.5835 | \n", "-9.28778 | \n", "28.74570 | \n", "-14.67190 | \n", "30.2089 | \n", "-0.468368 | \n", "1.883310 | \n", "1 | \n", "88.2438 | \n", "
3 | \n", "165617 | \n", "75833588 | \n", "G | \n", "181.8770 | \n", "44.14270 | \n", "-14.9498 | \n", "175.8040 | \n", "46.6055 | \n", "2.037920 | \n", "-0.326545 | \n", "... | \n", "G | \n", "170.0210 | \n", "-34.63010 | \n", "12.32480 | \n", "166.00000 | \n", "36.7579 | \n", "2.212820 | \n", "2.799670 | \n", "-1 | \n", "83.0943 | \n", "
4 | \n", "165617 | \n", "75779415 | \n", "G | \n", "50.2440 | \n", "37.80720 | \n", "-12.2044 | \n", "-30.7590 | \n", "39.7283 | \n", "-0.712422 | \n", "-0.312246 | \n", "... | \n", "G | \n", "49.2396 | \n", "-47.60640 | \n", "8.23376 | \n", "-9.50613 | \n", "48.3132 | \n", "-0.195513 | \n", "2.970330 | \n", "-1 | \n", "90.3544 | \n", "
5 rows × 21 columns
\n", "