{ "cells": [ { "metadata": { "trusted": true }, "cell_type": "code", "source": "from pyspark import SparkContext, SparkConf", "execution_count": 18, "outputs": [] }, { "metadata": { "trusted": true }, "cell_type": "code", "source": "# Spark configuration for this notebook; the application name is set to 'pyspark'.\nconf = SparkConf().setAppName('pyspark')", "execution_count": 21, "outputs": [] }, { "metadata": { "trusted": true }, "cell_type": "code", "source": "# Reuse the already-running SparkContext when this cell is executed again.\n# Calling SparkContext(conf=conf) a second time in the same kernel raises\n# ValueError because only one SparkContext may be active at a time.\nsc = SparkContext.getOrCreate(conf=conf)", "execution_count": 22, "outputs": [] }, { "metadata": { "trusted": true }, "cell_type": "code", "source": "# General:\nimport sys\nimport tweepy # To consume Twitter's API\nimport re\nimport math\nimport numpy as np\nsc", "execution_count": 23, "outputs": [ { "output_type": "execute_result", "execution_count": 23, "data": { "text/html": "\n
\n ", "text/plain": "