{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "### Necessary imports" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "collapsed": true }, "outputs": [], "source": [ "# Importing the classes from 'gydelt'\n", "from gydelt.gydelt import GetData, ProcessData \n", "\n", "# Creating object of GetData\n", "GD = GetData()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### Reading from a file" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | Date | \n", "NumArticles | \n", "Counts | \n", "Themes | \n", "Locations | \n", "Persons | \n", "Organizations | \n", "ToneData | \n", "CAMEOEvents | \n", "Sources | \n", "SourceURLs | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "DRONES;NATURAL_DISASTER;NATURAL_DISASTER_ICY;U... | \n", "2#California, United States#US#USCA#36.17#-119... | \n", "steve chien;andrew thompson | \n", "artificial intelligence group;propulsion labor... | \n", "-1.16279069767442,1.62790697674419,2.790697674... | \n", "NaN | \n", "sify.com | \n", "http://www.sify.com/news/nasas-intelligent-und... | \n", "
| 1 | \n", "2016-12-01 | \n", "1 | \n", "SEIZE#85##1#Ireland#EI#EI#53#-8#EI; | \n", "TAX_FNCACT;TAX_FNCACT_CHILD;RAPE;WB_2024_ANTI_... | \n", "1#Ireland#EI#EI#53#-8#EI;1#Germany#GM#GM#51#9#... | \n", "claudia peersman;awais rashid | \n", "p networks;german research centre for artifici... | \n", "-4.33815350389321,1.33481646273637,5.672969966... | \n", "604376665,604109997 | \n", "wired.co.uk | \n", "http://www.wired.co.uk/article/ai-interpol-tra... | \n", "
| 2 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "EPU_ECONOMY_HISTORIC;ECON_STOCKMARKET;EDUCATIO... | \n", "1#Japan#JA#JA#36#138#JA;4#Tokyo, Tokyo, Japan#... | \n", "tom foley | \n", "paxton center school;hampshire college in amhe... | \n", "4.13533834586466,5.26315789473684,1.1278195488... | \n", "604128888 | \n", "thelandmark.com | \n", "http://www.thelandmark.com/news/2016-12-01/Pax... | \n", "
| 3 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "UNGP_FORESTS_RIVERS_OCEANS;MEDIA_MSM;WB_566_EN... | \n", "3#Moss Landing, California, United States#US#U... | \n", "steve chien;andrew thompson | \n", "propulsion laboratory;net enterprises;monterey... | \n", "-1.03626943005181,2.2020725388601,3.2383419689... | \n", "604152212 | \n", "clarksvilleonline.com | \n", "http://www.clarksvilleonline.com/2016/12/01/na... | \n", "
| 4 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "DRONES;NATURAL_DISASTER;NATURAL_DISASTER_ICY;U... | \n", "2#California, United States#US#USCA#36.17#-119... | \n", "andrew thompson;steve chien | \n", "artificial intelligence group;propulsion labor... | \n", "-1.30548302872063,2.088772845953,3.39425587467... | \n", "NaN | \n", "newkerala.com | \n", "http://www.newkerala.com/news/2016/fullnews-14... | \n", "
| \n", " | Date | \n", "NumArticles | \n", "Counts | \n", "Themes | \n", "Locations | \n", "Persons | \n", "Organizations | \n", "ToneData | \n", "CAMEOEvents | \n", "Sources | \n", "SourceURLs | \n", "Countries | \n", "Tone | \n", "Positive Score | \n", "Negative Score | \n", "Polarity | \n", "Activity Reference Density | \n", "Self/Group Reference Density | \n", "Word Count | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "DRONES;NATURAL_DISASTER;NATURAL_DISASTER_ICY;U... | \n", "2#California, United States#US#USCA#36.17#-119... | \n", "steve chien;andrew thompson | \n", "artificial intelligence group;propulsion labor... | \n", "-1.16279069767442,1.62790697674419,2.790697674... | \n", "NaN | \n", "sify.com | \n", "http://www.sify.com/news/nasas-intelligent-und... | \n", "United States | \n", "-1.162791 | \n", "1.627907 | \n", "2.790698 | \n", "4.418605 | \n", "24.186047 | \n", "1.162791 | \n", "None | \n", "
| 1 | \n", "2016-12-01 | \n", "1 | \n", "SEIZE#85##1#Ireland#EI#EI#53#-8#EI; | \n", "TAX_FNCACT;TAX_FNCACT_CHILD;RAPE;WB_2024_ANTI_... | \n", "1#Ireland#EI#EI#53#-8#EI;1#Germany#GM#GM#51#9#... | \n", "claudia peersman;awais rashid | \n", "p networks;german research centre for artifici... | \n", "-4.33815350389321,1.33481646273637,5.672969966... | \n", "604376665,604109997 | \n", "wired.co.uk | \n", "http://www.wired.co.uk/article/ai-interpol-tra... | \n", "Ireland;France;Germany | \n", "-4.338154 | \n", "1.334816 | \n", "5.672970 | \n", "7.007786 | \n", "21.357063 | \n", "0.556174 | \n", "None | \n", "
| 2 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "EPU_ECONOMY_HISTORIC;ECON_STOCKMARKET;EDUCATIO... | \n", "1#Japan#JA#JA#36#138#JA;4#Tokyo, Tokyo, Japan#... | \n", "tom foley | \n", "paxton center school;hampshire college in amhe... | \n", "4.13533834586466,5.26315789473684,1.1278195488... | \n", "604128888 | \n", "thelandmark.com | \n", "http://www.thelandmark.com/news/2016-12-01/Pax... | \n", "Japan | \n", "4.135338 | \n", "5.263158 | \n", "1.127820 | \n", "6.390977 | \n", "25.939850 | \n", "0.751880 | \n", "None | \n", "
| 3 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "UNGP_FORESTS_RIVERS_OCEANS;MEDIA_MSM;WB_566_EN... | \n", "3#Moss Landing, California, United States#US#U... | \n", "steve chien;andrew thompson | \n", "propulsion laboratory;net enterprises;monterey... | \n", "-1.03626943005181,2.2020725388601,3.2383419689... | \n", "604152212 | \n", "clarksvilleonline.com | \n", "http://www.clarksvilleonline.com/2016/12/01/na... | \n", "United States;France | \n", "-1.036269 | \n", "2.202073 | \n", "3.238342 | \n", "5.440415 | \n", "25.259067 | \n", "1.683938 | \n", "None | \n", "
| 4 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "DRONES;NATURAL_DISASTER;NATURAL_DISASTER_ICY;U... | \n", "2#California, United States#US#USCA#36.17#-119... | \n", "andrew thompson;steve chien | \n", "artificial intelligence group;propulsion labor... | \n", "-1.30548302872063,2.088772845953,3.39425587467... | \n", "NaN | \n", "newkerala.com | \n", "http://www.newkerala.com/news/2016/fullnews-14... | \n", "United States | \n", "-1.305483 | \n", "2.088773 | \n", "3.394256 | \n", "5.483029 | \n", "25.587467 | \n", "1.827676 | \n", "None | \n", "
| \n", " | Date | \n", "NumArticles | \n", "Counts | \n", "Themes | \n", "Locations | \n", "Persons | \n", "Organizations | \n", "ToneData | \n", "CAMEOEvents | \n", "Sources | \n", "... | \n", "United Kingdom | \n", "United States | \n", "Uruguay | \n", "Uzbekistan | \n", "Venezuela | \n", "Vietnam | \n", "Western Sahara | \n", "Yemen | \n", "Zambia | \n", "Zimbabwe | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "DRONES;NATURAL_DISASTER;NATURAL_DISASTER_ICY;U... | \n", "2#California, United States#US#USCA#36.17#-119... | \n", "steve chien;andrew thompson | \n", "artificial intelligence group;propulsion labor... | \n", "-1.16279069767442,1.62790697674419,2.790697674... | \n", "NaN | \n", "sify.com | \n", "... | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 1 | \n", "2016-12-01 | \n", "1 | \n", "SEIZE#85##1#Ireland#EI#EI#53#-8#EI; | \n", "TAX_FNCACT;TAX_FNCACT_CHILD;RAPE;WB_2024_ANTI_... | \n", "1#Ireland#EI#EI#53#-8#EI;1#Germany#GM#GM#51#9#... | \n", "claudia peersman;awais rashid | \n", "p networks;german research centre for artifici... | \n", "-4.33815350389321,1.33481646273637,5.672969966... | \n", "604376665,604109997 | \n", "wired.co.uk | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 2 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "EPU_ECONOMY_HISTORIC;ECON_STOCKMARKET;EDUCATIO... | \n", "1#Japan#JA#JA#36#138#JA;4#Tokyo, Tokyo, Japan#... | \n", "tom foley | \n", "paxton center school;hampshire college in amhe... | \n", "4.13533834586466,5.26315789473684,1.1278195488... | \n", "604128888 | \n", "thelandmark.com | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 3 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "UNGP_FORESTS_RIVERS_OCEANS;MEDIA_MSM;WB_566_EN... | \n", "3#Moss Landing, California, United States#US#U... | \n", "steve chien;andrew thompson | \n", "propulsion laboratory;net enterprises;monterey... | \n", "-1.03626943005181,2.2020725388601,3.2383419689... | \n", "604152212 | \n", "clarksvilleonline.com | \n", "... | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 4 | \n", "2016-12-01 | \n", "1 | \n", "NaN | \n", "DRONES;NATURAL_DISASTER;NATURAL_DISASTER_ICY;U... | \n", "2#California, United States#US#USCA#36.17#-119... | \n", "andrew thompson;steve chien | \n", "artificial intelligence group;propulsion labor... | \n", "-1.30548302872063,2.088772845953,3.39425587467... | \n", "NaN | \n", "newkerala.com | \n", "... | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
5 rows × 154 columns
\n", "| \n", " | Date | \n", "NumArticles | \n", "Counts | \n", "Themes | \n", "Locations | \n", "Persons | \n", "Organizations | \n", "ToneData | \n", "CAMEOEvents | \n", "Sources | \n", "... | \n", "United Kingdom | \n", "United States | \n", "Uruguay | \n", "Uzbekistan | \n", "Venezuela | \n", "Vietnam | \n", "Western Sahara | \n", "Yemen | \n", "Zambia | \n", "Zimbabwe | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 48 | \n", "2016-12-03 | \n", "1 | \n", "NaN | \n", "GENERAL_GOVERNMENT;SOVEREIGNTY;TAX_FNCACT;TAX_... | \n", "1#Vietnam, Republic Of#VM#VM#16#106#VM;4#Dongh... | \n", "marco polo;longji dragon;zonghe guangbo jiaoto... | \n", "artificial intelligence laboratory;google;inst... | \n", "1.01102104016759,2.36815739138355,1.3571363512... | \n", "NaN | \n", "wn.com | \n", "... | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 138 | \n", "2016-12-12 | \n", "1 | \n", "NaN | \n", "TAX_FNCACT;TAX_FNCACT_LEADER;ENV_OIL;TAX_ECON_... | \n", "1#China#CH#CH#35#105#CH;1#Mexico#MX#MX#23#-102... | \n", "unknown | \n", "broadcom;ericsson;ibm;facebook;visa;artificial... | \n", "1.36570561456753,3.33839150227618,1.9726858877... | \n", "NaN | \n", "sharesinv.com | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 165 | \n", "2016-12-14 | \n", "1 | \n", "NaN | \n", "unknown | \n", "3#University Of Louisville, Kentucky, United S... | \n", "deepmind alphago;demis hassabis;david kenny;jo... | \n", "houston methodist research institute;cybersecu... | \n", "0.916380297823597,3.55097365406644,2.634593356... | \n", "NaN | \n", "techrepublic.com | \n", "... | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 214 | \n", "2016-12-19 | \n", "1 | \n", "NaN | \n", "TECH_AUTOMATION;WB_1921_PRIVATE_SECTOR_DEVELOP... | \n", "1#China#CH#CH#35#105#CH;2#New York, United Sta... | \n", "paul allen;jon talton;bill gates | \n", "boeing;allen institute for artificial intellig... | \n", "-0.900900900900901,2.5025025025025,3.403403403... | \n", "609815768,609817195,609817718,609649509 | \n", "crosscut.com | \n", "... | \n", "NaN | \n", "1.0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
| 231 | \n", "2016-12-21 | \n", "1 | \n", "NaN | \n", "unknown | \n", "1#United States#US#US#38#-97#US;1#China#CH#CH#... | \n", "baidu facebook;gabriele ketterl | \n", "ibm;united states artificial intelligence mach... | \n", "0.809716599190283,3.96761133603239,3.157894736... | \n", "NaN | \n", "openpr.com | \n", "... | \n", "1.0 | \n", "1.0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
5 rows × 154 columns
\n", "