{
"cells": [
{
"cell_type": "markdown",
"id": "bf1b03a9-4aeb-43dd-870f-b8630151a247",
"metadata": {},
"source": [
"# Stock Prediction Deep Learning Model with Sentiment Analysis\n",
"\n",
"##### This notebook first evaluates a plain LSTM, and then an LSTM combined with sentiment analysis."
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "eb97a1b2-770f-4e5e-b944-bc44aa6e9243",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Num GPUs Available: 1\n"
]
}
],
"source": [
"# Last updated: 10/18/2023.\n",
"# Copyright 2023 Shane Khalid. All Rights Reserved.\n",
"#\n",
"# Licensed under the Apache License, Version 2.0 (the \"License\");\n",
"# you may not use this file except in compliance with the License.\n",
"# You may obtain a copy of the License at\n",
"#\n",
"# http://www.apache.org/licenses/LICENSE-2.0\n",
"#\n",
"# Unless required by applicable law or agreed to in writing, software\n",
"# distributed under the License is distributed on an \"AS IS\" BASIS,\n",
"# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n",
"# See the License for the specific language governing permissions and\n",
"# limitations under the License.\n",
"# ==============================================================================\n",
"\n",
"\n",
"import math \n",
"import time\n",
"import numpy as np\n",
"import pandas as pd\n",
"import seaborn as sns\n",
"import matplotlib.pyplot as plt\n",
"import matplotlib.dates as mdates\n",
"import tensorflow as tf\n",
"from keras.models import Sequential\n",
"from keras.callbacks import EarlyStopping\n",
"from keras.layers import LSTM, Dense, Dropout\n",
"from datetime import date, timedelta, datetime\n",
"from pandas.plotting import register_matplotlib_converters\n",
"from sklearn.preprocessing import RobustScaler, MinMaxScaler\n",
"from sklearn.metrics import mean_absolute_error, mean_squared_error\n",
"from tensorflow.keras import utils\n",
"# Report how many GPUs TensorFlow can see\n",
"print(\"Num GPUs Available: \", len(tf.config.experimental.list_physical_devices('GPU')))\n",
"import os\n",
"import csv\n",
"import json\n",
"import datetime\n",
"import pandas as pd\n",
"from tqdm import tqdm\n",
"import snscrape.modules.twitter as sntwitter\n",
"from datetime import datetime"
]
},
{
"cell_type": "markdown",
"id": "a830f253-822d-400d-953c-3b01ab057f66",
"metadata": {},
"source": [
"### Loading Dataset\n",
"\n",
"##### This time the historical price data is downloaded directly from Yahoo Finance."
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "dae01ef7-9acd-4671-987c-9dc582af0bbc",
"metadata": {},
"outputs": [],
"source": [
"# Download historical daily stock prices from 1 Jan 2010 up to today\n",
"stockname = 'GOOG'\n",
"interval = '1d'\n",
"date_today = date.today()\n",
"date_start = datetime.strptime('2010-01-01', \"%Y-%m-%d\")\n",
"\n",
"# The download URL takes the date range as Unix timestamps (seconds, local time)\n",
"period1 = int(time.mktime(date_start.timetuple()))\n",
"period2 = int(time.mktime(date_today.timetuple()))\n",
"query_string = f'https://query1.finance.yahoo.com/v7/finance/download/{stockname}?period1={period1}&period2={period2}&interval={interval}&events=history&includeAdjustedClose=true'\n",
"\n",
"# Cache the raw download as CSV. index=False keeps the meaningless RangeIndex out of\n",
"# the file, so no 'Unnamed: 0' column has to be dropped after reloading.\n",
"stocks_data = pd.read_csv(query_string)\n",
"stocks_data.to_csv(stockname + '.csv', index=False)\n",
"\n",
"# Reload the cached file with the trading date parsed as the index\n",
"df = pd.read_csv(stockname + '.csv', parse_dates=True, index_col=['Date'])"
]
},
{
"cell_type": "markdown",
"id": "8d2dbb84-4fbc-46b7-a401-5172a4ab0504",
"metadata": {},
"source": [
"### EDA"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "f4412171-e5b0-4c7f-9053-b8bdad4983b2",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"
\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" Open | \n",
" High | \n",
" Low | \n",
" Close | \n",
" Adj Close | \n",
" Volume | \n",
"
\n",
" \n",
" Date | \n",
" | \n",
" | \n",
" | \n",
" | \n",
" | \n",
" | \n",
"
\n",
" \n",
" \n",
" \n",
" 2010-01-04 | \n",
" 15.615220 | \n",
" 15.678981 | \n",
" 15.547723 | \n",
" 15.610239 | \n",
" 15.610239 | \n",
" 78541293 | \n",
"
\n",
" \n",
" 2010-01-05 | \n",
" 15.620949 | \n",
" 15.637387 | \n",
" 15.480475 | \n",
" 15.541497 | \n",
" 15.541497 | \n",
" 120638494 | \n",
"
\n",
" \n",
" 2010-01-06 | \n",
" 15.588072 | \n",
" 15.588072 | \n",
" 15.102393 | \n",
" 15.149715 | \n",
" 15.149715 | \n",
" 159744526 | \n",
"
\n",
" \n",
" 2010-01-07 | \n",
" 15.178109 | \n",
" 15.193053 | \n",
" 14.760922 | \n",
" 14.797037 | \n",
" 14.797037 | \n",
" 257533695 | \n",
"
\n",
" \n",
" 2010-01-08 | \n",
" 14.744733 | \n",
" 15.024933 | \n",
" 14.672753 | \n",
" 14.994298 | \n",
" 14.994298 | \n",
" 189680313 | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" Open High Low Close Adj Close Volume\n",
"Date \n",
"2010-01-04 15.615220 15.678981 15.547723 15.610239 15.610239 78541293\n",
"2010-01-05 15.620949 15.637387 15.480475 15.541497 15.541497 120638494\n",
"2010-01-06 15.588072 15.588072 15.102393 15.149715 15.149715 159744526\n",
"2010-01-07 15.178109 15.193053 14.760922 14.797037 14.797037 257533695\n",
"2010-01-08 14.744733 15.024933 14.672753 14.994298 14.994298 189680313"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Preview the first rows of the downloaded price history\n",
"df.head()"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "439ae221-db11-42b5-aa27-d5847a24fc5c",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "",
"text/plain": [
""
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Plot every column of the price history in its own panel\n",
"df_plot = df.copy()\n",
"list_length = df_plot.shape[1]\n",
"ncols = 2\n",
"# Ceiling division: round() uses banker's rounding, so e.g. 5 columns produced only\n",
"# 2 rows (4 panels) and a single column produced 0 rows.\n",
"nrows = math.ceil(list_length / ncols)\n",
"# squeeze=False always yields a 2-D array of Axes, whatever the grid size\n",
"fig, axes = plt.subplots(nrows=nrows, ncols=ncols, sharex=True, figsize=(14, 7), squeeze=False)\n",
"fig.subplots_adjust(hspace=0.5, wspace=0.5)\n",
"colors = ['blue', 'red', 'green', 'pink', 'orange', 'purple']\n",
"panels = axes.flatten()\n",
"for i in range(list_length):\n",
"    ax = panels[i]\n",
"    # Wrap around the palette so frames with more than six columns do not raise IndexError\n",
"    sns.lineplot(data=df_plot.iloc[:, i], ax=ax, color=colors[i % len(colors)])\n",
"    ax.set_title(df_plot.columns[i])\n",
"    ax.tick_params(axis=\"x\", rotation=30, labelsize=10, length=0)\n",
"    ax.xaxis.set_major_locator(mdates.AutoDateLocator())\n",
"\n",
"# Hide any panels left over when the grid has more cells than there are columns\n",
"for spare_ax in panels[list_length:]:\n",
"    spare_ax.set_visible(False)\n",
"\n",
"fig.tight_layout()\n",
"plt.show()"
]
},
{
"cell_type": "markdown",
"id": "847927f0-10a2-4b70-8a06-7ea57090509c",
"metadata": {},
"source": [
"### Preprocessing Data"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "217b1fdb-52f6-4673-b78d-b93e64d34544",
"metadata": {},
"outputs": [],
"source": [
"# Build sliding-window samples: one window of sequence_length rows per target value\n",
"def splitData(sequence_length, data, index_Close):\n",
"    \"\"\"Slice ``data`` into overlapping windows and their next-step targets.\n",
"\n",
"    For every row position ``end`` from ``sequence_length`` up to the last row,\n",
"    the sample is ``data[end - sequence_length:end, :]`` (all columns) and the\n",
"    target is ``data[end, index_Close]``, i.e. single-step prediction.\n",
"\n",
"    Returns the samples and the targets as two numpy arrays ``(x, y)``.\n",
"    \"\"\"\n",
"    n_rows = data.shape[0]\n",
"    window_ends = range(sequence_length, n_rows)\n",
"    # Each window holds the sequence_length rows that precede its target row\n",
"    x = np.array([data[end - sequence_length:end, :] for end in window_ends])\n",
"    # The target is the index_Close column of the row right after the window\n",
"    y = np.array([data[end, index_Close] for end in window_ends])\n",
"    return x, y\n",
"\n",
"def processData(df, FEATURES, sequence_length=50, train_fraction=0.8):\n",
"    \"\"\"Scale the selected features and build windowed train/test sets.\n",
"\n",
"    Parameters\n",
"    ----------\n",
"    df : DataFrame that can be sorted by 'Date' and contains every column in FEATURES.\n",
"    FEATURES : list of column names fed to the model; must include 'Close'.\n",
"    sequence_length : number of past rows used to make a single prediction.\n",
"    train_fraction : share of rows (rounded up) assigned to the training split.\n",
"\n",
"    Returns\n",
"    -------\n",
"    x_train, y_train, x_test, y_test, data_filtered, date_index, scaler,\n",
"    scaler_pred, train_data_len, sequence_length\n",
"\n",
"    Raises\n",
"    ------\n",
"    ValueError if the training split is not longer than sequence_length.\n",
"    \"\"\"\n",
"    # Sort chronologically and keep the dates before switching to a numeric index\n",
"    train_df = df.sort_values(by=['Date']).copy()\n",
"    date_index = train_df.index\n",
"    train_df = train_df.reset_index(drop=True)\n",
"\n",
"    # Restrict the data to the requested feature columns (in FEATURES order)\n",
"    data_filtered = train_df[FEATURES]\n",
"    np_data_unscaled = np.array(data_filtered)\n",
"\n",
"    # Scale every feature to the range [0, 1].\n",
"    # NOTE(review): both scalers are fitted on the full history, so test-period\n",
"    # minima/maxima leak into the training data; left unchanged to keep results comparable.\n",
"    scaler = MinMaxScaler()\n",
"    np_data_scaled = scaler.fit_transform(np_data_unscaled)\n",
"    # Separate single-column scaler, used later to un-scale predictions\n",
"    scaler_pred = MinMaxScaler()\n",
"    scaler_pred.fit(data_filtered[['Close']])\n",
"\n",
"    # Position of 'Close' inside the *filtered* columns: the scaled array is built\n",
"    # from data_filtered, so the index must not come from the unfiltered frame.\n",
"    index_Close = data_filtered.columns.get_loc('Close')\n",
"\n",
"    # Chronological split into train and test rows\n",
"    train_data_len = math.ceil(np_data_scaled.shape[0] * train_fraction)\n",
"    if train_data_len <= sequence_length:\n",
"        raise ValueError('training split must contain more rows than sequence_length')\n",
"    train_data = np_data_scaled[:train_data_len, :]\n",
"    # The test split starts sequence_length rows early so its first window is complete\n",
"    test_data = np_data_scaled[train_data_len - sequence_length:, :]\n",
"\n",
"    # Generate the windowed samples and their targets\n",
"    x_train, y_train = splitData(sequence_length, train_data, index_Close)\n",
"    x_test, y_test = splitData(sequence_length, test_data, index_Close)\n",
"\n",
"    return (x_train, y_train, x_test, y_test, data_filtered,\n",
"            date_index, scaler, scaler_pred, train_data_len, sequence_length)"
]
},
{
"cell_type": "markdown",
"id": "60add952-ca35-487f-bc5b-3fbe5558c4c8",
"metadata": {},
"source": [
"### Train LSTM model\n",
"\n",
"##### Same architecture as usual, compiled with the Adam optimizer and MSE loss."
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "88c6193d-4946-4f19-ae55-cf5bfe6707f0",
"metadata": {},
"outputs": [],
"source": [
"# Setting up LSTM model architecture\n",
"\n",
"def getModel(x_train):\n",
"    \"\"\"Build and compile the stacked-LSTM regression model.\n",
"\n",
"    The width of both LSTM layers is the number of timesteps times the number\n",
"    of features, both read from the shape of ``x_train``. Returns the compiled model.\n",
"    \"\"\"\n",
"    timesteps, n_features = x_train.shape[1], x_train.shape[2]\n",
"    n_neurons = timesteps * n_features\n",
"\n",
"    # Two LSTM layers followed by a small dense head with a single output\n",
"    model = Sequential([\n",
"        LSTM(n_neurons, return_sequences=True, input_shape=(timesteps, n_features)),\n",
"        LSTM(n_neurons, return_sequences=False),\n",
"        Dense(5),\n",
"        Dense(1),\n",
"    ])\n",
"\n",
"    # Adam optimizer with mean squared error as the loss\n",
"    model.compile(optimizer='adam', loss='mse')\n",
"    return model"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "e0dd7500-3179-4691-aee6-7d51ae1cdda1",
"metadata": {},
"outputs": [],
"source": [
"def plotLossCurve(history, color, title):\n",
"    \"\"\"Plot the loss curves recorded in ``history.history``.\n",
"\n",
"    The training loss is always drawn (solid line). The validation loss is drawn\n",
"    as a dashed line when ``history.history`` contains a ``val_loss`` entry.\n",
"    Both curves use ``color``; ``title`` is the figure title.\n",
"    \"\"\"\n",
"    fig, ax = plt.subplots(figsize=(7, 6))\n",
"    ax.plot(history.history[\"loss\"], color=color, label=\"Train\")\n",
"    # The legend is built from labels, so it can only list curves that were\n",
"    # actually plotted (it used to name a \"Test\" curve that was never drawn).\n",
"    val_loss = history.history.get(\"val_loss\")\n",
"    if val_loss is not None:\n",
"        ax.plot(val_loss, color=color, linestyle=\"--\", label=\"Test\")\n",
"    ax.set_title(title)\n",
"    ax.set_ylabel(\"Loss\")\n",
"    ax.set_xlabel(\"Epoch\")\n",
"    plt.xticks(rotation=45)\n",
"    ax.legend(loc=\"upper left\")\n",
"    plt.show()"
]
},
{
"cell_type": "markdown",
"id": "445d8322-15b5-4a58-be0f-323fd901a9a7",
"metadata": {},
"source": [
"### Evaluate Model Performance"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "a8ae2151-be7f-4572-9c80-2f45fe25979b",
"metadata": {},
"outputs": [],
"source": [
"def eval(model, x_test, y_test, scaler_pred):\n",
"    \"\"\"Predict on the test windows and report errors in unscaled price units.\n",
"\n",
"    Predictions and targets are un-scaled with ``scaler_pred`` before the\n",
"    metrics are computed and printed.\n",
"\n",
"    Returns ``(MAE, MAPE, MDAPE, y_pred)`` where ``y_pred`` holds the unscaled predictions.\n",
"\n",
"    NOTE: the name shadows the built-in ``eval``; it is kept so existing callers still work.\n",
"    \"\"\"\n",
"    # Get the predicted values and undo the scaling on predictions and targets\n",
"    y_pred_scaled = model.predict(x_test)\n",
"    y_pred = scaler_pred.inverse_transform(y_pred_scaled)\n",
"    y_test_unscaled = scaler_pred.inverse_transform(y_test.reshape(-1, 1))\n",
"\n",
"    # Mean Absolute Error (MAE); the printed label used to say \"Median\" by mistake\n",
"    MAE = mean_absolute_error(y_test_unscaled, y_pred)\n",
"    print(f'Mean Absolute Error (MAE): {np.round(MAE, 2)}')\n",
"\n",
"    # Absolute percentage error per sample, shared by the two metrics below\n",
"    abs_pct_error = np.abs(np.subtract(y_test_unscaled, y_pred) / y_test_unscaled)\n",
"\n",
"    # Mean Absolute Percentage Error (MAPE)\n",
"    MAPE = np.mean(abs_pct_error) * 100\n",
"    print(f'Mean Absolute Percentage Error (MAPE): {np.round(MAPE, 2)} %')\n",
"\n",
"    # Median Absolute Percentage Error (MDAPE)\n",
"    MDAPE = np.median(abs_pct_error) * 100\n",
"    print(f'Median Absolute Percentage Error (MDAPE): {np.round(MDAPE, 2)} %')\n",
"\n",
"    return MAE, MAPE, MDAPE, y_pred"
]
},
{
"cell_type": "markdown",
"id": "c9dee881-880e-4851-af06-275de1c88089",
"metadata": {},
"source": [
"### Visualize"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "2fd57b78-c270-49cd-ae74-56caa4477e18",
"metadata": {},
"outputs": [],
"source": [
"def visualizePreds(data_filtered, train_data_len, y_pred, date_index, color):\n",
"    \"\"\"Plot recent training prices, actual test prices and test predictions.\n",
"\n",
"    Parameters\n",
"    ----------\n",
"    data_filtered : DataFrame with a 'Close' column, one row per entry of ``date_index``.\n",
"    train_data_len : number of leading rows that belong to the training split.\n",
"    y_pred : predictions for the rows from ``train_data_len`` onwards.\n",
"    date_index : dates matching the rows of ``data_filtered``.\n",
"    color : line colour of the prediction curve.\n",
"\n",
"    Only rows dated within the last 500 days are shown. The y-axis label is\n",
"    read from the notebook-level ``stockname``.\n",
"    \"\"\"\n",
"    # The date from which on the data is displayed\n",
"    display_start_date = pd.Timestamp('today') - timedelta(days=500)\n",
"    # Add the date column\n",
"    data_filtered_sub = data_filtered.copy()\n",
"    data_filtered_sub['Date'] = date_index\n",
"\n",
"    # train keeps one extra row so its line joins the first validation point\n",
"    train = data_filtered_sub[:train_data_len + 1]\n",
"    # Copy before adding a column so the new column is never written into a slice\n",
"    valid = data_filtered_sub[train_data_len:].copy()\n",
"    valid['Prediction'] = y_pred.ravel()\n",
"\n",
"    # Zoom in to a closer timeframe\n",
"    valid = valid[valid['Date'] > display_start_date]\n",
"    train = train[train['Date'] > display_start_date]\n",
"\n",
"    # Visualize the data; each line carries its own label so the legend cannot\n",
"    # drift out of sync with the plotting order\n",
"    fig, ax1 = plt.subplots(figsize=(10, 7))\n",
"    ax1.set_title(\"Predictions vs Actual Values\", fontsize=20)\n",
"    ax1.set_ylabel(stockname, fontsize=18)\n",
"    ax1.plot(train['Date'], train['Close'], color=\"green\", linewidth=2.0, label=\"Train\")\n",
"    ax1.plot(valid['Date'], valid['Prediction'], color=color, linewidth=2.0, label=\"Test Predictions\")\n",
"    ax1.plot(valid['Date'], valid['Close'], color=\"black\", linewidth=2.0, label=\"Actual Values\")\n",
"    ax1.legend(loc=\"upper left\")\n",
"    plt.show()"
]
},
{
"cell_type": "markdown",
"id": "b217a05e-7ac9-4160-947a-3d4dcf779ce7",
"metadata": {},
"source": [
"### Predict tomorrow's price"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "e13ad85b-663e-462f-90ad-b54bed486051",
"metadata": {},
"outputs": [],
"source": [
"def predictFuturePrice(model, df, sequence_length, feats, scaler, scaler_pred):\n",
"    \"\"\"Predict the next close price from the last ``sequence_length`` rows of ``df``.\n",
"\n",
"    Parameters\n",
"    ----------\n",
"    model : object whose ``predict`` accepts a batch of scaled windows.\n",
"    df : price history; its last ``sequence_length`` rows form the input window.\n",
"    sequence_length : number of rows in the input window.\n",
"    feats : feature columns to keep; must include 'Close'.\n",
"    scaler : fitted scaler applied to the feature window.\n",
"    scaler_pred : fitted scaler used to un-scale the predicted price.\n",
"\n",
"    Prints the last close and the predicted close. The percentage is the change\n",
"    relative to the last close. Reads the notebook-level ``stockname`` and\n",
"    ``date_today`` for the messages. Returns nothing.\n",
"    \"\"\"\n",
"    # Last sequence_length rows, restricted to the model's feature columns\n",
"    new_df = df[-sequence_length:].filter(feats)\n",
"    last_N_days_scaled = scaler.transform(new_df.values)\n",
"\n",
"    # Wrap the single window in a list so the model receives a batch of one\n",
"    pred_price_scaled = model.predict(np.array([last_N_days_scaled]))\n",
"    pred_price_unscaled = scaler_pred.inverse_transform(pred_price_scaled.reshape(-1, 1))\n",
"\n",
"    # .iloc selects by position; plain [-1] on a date-indexed Series is deprecated\n",
"    price_today = np.round(new_df['Close'].iloc[-1], 2)\n",
"    predicted_price = np.round(pred_price_unscaled.ravel()[0], 2)\n",
"    # Percent change relative to the last close (the base used to be the predicted price)\n",
"    change_percent = np.round((predicted_price - price_today) / price_today * 100, 2)\n",
"\n",
"    plus = '+'; minus = ''\n",
"    print(f'The close price for {stockname} at {date_today} was {price_today}')\n",
"    print(f'The predicted close price is {predicted_price} ({plus if change_percent > 0 else minus}{change_percent}%)')"
]
},
{
"cell_type": "markdown",
"id": "f75d1329-a3b7-4630-948d-1fbf2358b983",
"metadata": {},
"source": [
"### LSTM without Sentiment Analysis"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "22157680-4bf2-43c9-bd82-1f895063a270",
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"2023-10-19 17:27:27.723503: I tensorflow/compiler/xla/stream_executor/cuda/cuda_gpu_executor.cc:880] could not open file to read NUMA node: /sys/bus/pci/devices/0000:43:00.0/numa_node\n",
"Your kernel may have been built without NUMA support.\n",
"2023-10-19 17:27:27.723609: I tensorflow/compiler/xla/stream_executor/cuda/cuda_gpu_executor.cc:880] could not open file to read NUMA node: /sys/bus/pci/devices/0000:43:00.0/numa_node\n",
"Your kernel may have been built without NUMA support.\n",
"2023-10-19 17:27:27.723648: I tensorflow/compiler/xla/stream_executor/cuda/cuda_gpu_executor.cc:880] could not open file to read NUMA node: /sys/bus/pci/devices/0000:43:00.0/numa_node\n",
"Your kernel may have been built without NUMA support.\n",
"2023-10-19 17:27:28.951549: I tensorflow/compiler/xla/stream_executor/cuda/cuda_gpu_executor.cc:880] could not open file to read NUMA node: /sys/bus/pci/devices/0000:43:00.0/numa_node\n",
"Your kernel may have been built without NUMA support.\n",
"2023-10-19 17:27:28.951619: I tensorflow/compiler/xla/stream_executor/cuda/cuda_gpu_executor.cc:880] could not open file to read NUMA node: /sys/bus/pci/devices/0000:43:00.0/numa_node\n",
"Your kernel may have been built without NUMA support.\n",
"2023-10-19 17:27:28.951627: I tensorflow/core/common_runtime/gpu/gpu_device.cc:1977] Could not identify NUMA node of platform GPU id 0, defaulting to 0. Your kernel may not have been built with NUMA support.\n",
"2023-10-19 17:27:28.951697: I tensorflow/compiler/xla/stream_executor/cuda/cuda_gpu_executor.cc:880] could not open file to read NUMA node: /sys/bus/pci/devices/0000:43:00.0/numa_node\n",
"Your kernel may have been built without NUMA support.\n",
"2023-10-19 17:27:28.951724: I tensorflow/core/common_runtime/gpu/gpu_device.cc:1886] Created device /job:localhost/replica:0/task:0/device:GPU:0 with 21080 MB memory: -> device: 0, name: NVIDIA GeForce RTX 3090 Ti, pci bus id: 0000:43:00.0, compute capability: 8.6\n",
"2023-10-19 17:31:22.443601: I tensorflow/tsl/platform/default/subprocess.cc:304] Start cannot spawn child process: No such file or directory\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"You must install pydot (`pip install pydot`) and install graphviz (see instructions at https://graphviz.gitlab.io/download/) for plot_model to work.\n",
"Num GPUs Available: 1\n",
"Defaulting to user installation because normal site-packages is not writeable\n",
"Requirement already satisfied: pydot in ./.local/lib/python3.10/site-packages (1.4.2)\n",
"Requirement already satisfied: pyparsing>=2.1.4 in /usr/lib/python3/dist-packages (from pydot) (2.4.7)\n",
"Defaulting to user installation because normal site-packages is not writeable\n",
"Requirement already satisfied: graphviz in ./.local/lib/python3.10/site-packages (0.20.1)\n"
]
}
],
"source": [
"# Install plot_model's Python dependencies *before* it is called (they used to be\n",
"# installed after the call, so plot_model failed on a fresh environment).\n",
"# %pip targets the running kernel's environment; the versions are pinned to the\n",
"# ones this notebook was last run with.\n",
"# NOTE: the Graphviz system binaries must also be installed for plot_model to render.\n",
"%pip install -q pydot==1.4.2 graphviz==0.20.1\n",
"\n",
"# List of considered features\n",
"features1 = ['High', 'Low', 'Open', 'Close', 'Volume']\n",
"# Split and process dataset\n",
"(x_train1, y_train1, x_test1, y_test1, data_filtered1, date_index1,\n",
" scaler1, scaler_pred1, train_data_len1, sequence_length1) = processData(df, features1)\n",
"# Get Model\n",
"model1 = getModel(x_train1)\n",
"print(\"Num GPUs Available: \", len(tf.config.experimental.list_physical_devices('GPU')))\n",
"\n",
"# Visualizing Model Architecture (kept as the last expression so the diagram is displayed)\n",
"tf.keras.utils.plot_model(model1, show_shapes=True)"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "19ce2cc3-a825-42d7-a5a0-07fb82cb7aea",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Model: \"sequential\"\n",
"_________________________________________________________________\n",
" Layer (type) Output Shape Param # \n",
"=================================================================\n",
" lstm (LSTM) (None, 50, 250) 256000 \n",
" \n",
" lstm_1 (LSTM) (None, 250) 501000 \n",
" \n",
" dense (Dense) (None, 5) 1255 \n",
" \n",
" dense_1 (Dense) (None, 1) 6 \n",
" \n",
"=================================================================\n",
"Total params: 758261 (2.89 MB)\n",
"Trainable params: 758261 (2.89 MB)\n",
"Non-trainable params: 0 (0.00 Byte)\n",
"_________________________________________________________________\n"
]
}
],
"source": [
"# Print the layer-by-layer summary of the baseline model\n",
"model1.summary()"
]
},
{
"cell_type": "code",
"execution_count": 33,
"id": "adf10162-a17a-4225-bd2b-8b9b31f1057b",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Epoch 1/300\n",
"6/6 [==============================] - 0s 36ms/step - loss: 5.1939e-05 - val_loss: 5.8007e-04\n",
"Epoch 2/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.1459e-05 - val_loss: 6.0817e-04\n",
"Epoch 3/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.6616e-05 - val_loss: 5.9028e-04\n",
"Epoch 4/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.9010e-05 - val_loss: 8.4292e-04\n",
"Epoch 5/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 6.1818e-05 - val_loss: 5.7464e-04\n",
"Epoch 6/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.3029e-05 - val_loss: 5.6822e-04\n",
"Epoch 7/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.1655e-05 - val_loss: 5.7920e-04\n",
"Epoch 8/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.0274e-05 - val_loss: 5.6693e-04\n",
"Epoch 9/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 5.1249e-05 - val_loss: 5.5994e-04\n",
"Epoch 10/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.0582e-05 - val_loss: 5.6805e-04\n",
"Epoch 11/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.1368e-05 - val_loss: 5.7401e-04\n",
"Epoch 12/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 5.1662e-05 - val_loss: 5.5698e-04\n",
"Epoch 13/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 5.4154e-05 - val_loss: 5.5627e-04\n",
"Epoch 14/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 5.2049e-05 - val_loss: 6.3676e-04\n",
"Epoch 15/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.1783e-05 - val_loss: 5.7822e-04\n",
"Epoch 16/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.9757e-05 - val_loss: 5.7506e-04\n",
"Epoch 17/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.9588e-05 - val_loss: 5.7315e-04\n",
"Epoch 18/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.0603e-05 - val_loss: 5.9778e-04\n",
"Epoch 19/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 5.1515e-05 - val_loss: 5.5057e-04\n",
"Epoch 20/300\n",
"6/6 [==============================] - 0s 37ms/step - loss: 5.0911e-05 - val_loss: 5.9532e-04\n",
"Epoch 21/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 5.0137e-05 - val_loss: 5.9072e-04\n",
"Epoch 22/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.8706e-05 - val_loss: 5.4667e-04\n",
"Epoch 23/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.8973e-05 - val_loss: 5.4473e-04\n",
"Epoch 24/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.8683e-05 - val_loss: 5.7136e-04\n",
"Epoch 25/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.0623e-05 - val_loss: 6.3984e-04\n",
"Epoch 26/300\n",
"6/6 [==============================] - 0s 30ms/step - loss: 6.0414e-05 - val_loss: 8.6026e-04\n",
"Epoch 27/300\n",
"6/6 [==============================] - 0s 30ms/step - loss: 6.5069e-05 - val_loss: 6.3403e-04\n",
"Epoch 28/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 6.5269e-05 - val_loss: 8.0473e-04\n",
"Epoch 29/300\n",
"6/6 [==============================] - 0s 30ms/step - loss: 6.5151e-05 - val_loss: 6.2235e-04\n",
"Epoch 30/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 6.0876e-05 - val_loss: 8.0697e-04\n",
"Epoch 31/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 6.1552e-05 - val_loss: 6.3418e-04\n",
"Epoch 32/300\n",
"6/6 [==============================] - 0s 30ms/step - loss: 5.7528e-05 - val_loss: 5.2875e-04\n",
"Epoch 33/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 5.5271e-05 - val_loss: 6.4730e-04\n",
"Epoch 34/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 5.1992e-05 - val_loss: 7.8030e-04\n",
"Epoch 35/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 5.5727e-05 - val_loss: 5.3203e-04\n",
"Epoch 36/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.5673e-05 - val_loss: 6.3177e-04\n",
"Epoch 37/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.1613e-05 - val_loss: 5.2338e-04\n",
"Epoch 38/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 5.0783e-05 - val_loss: 5.8298e-04\n",
"Epoch 39/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.7435e-05 - val_loss: 5.2410e-04\n",
"Epoch 40/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.7786e-05 - val_loss: 5.3591e-04\n",
"Epoch 41/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.7503e-05 - val_loss: 5.4940e-04\n",
"Epoch 42/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.6452e-05 - val_loss: 5.4002e-04\n",
"Epoch 43/300\n",
"6/6 [==============================] - 0s 30ms/step - loss: 4.6442e-05 - val_loss: 5.1866e-04\n",
"Epoch 44/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.6059e-05 - val_loss: 5.1688e-04\n",
"Epoch 45/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.5808e-05 - val_loss: 5.2306e-04\n",
"Epoch 46/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.6525e-05 - val_loss: 5.1967e-04\n",
"Epoch 47/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.8092e-05 - val_loss: 5.1659e-04\n",
"Epoch 48/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.7516e-05 - val_loss: 5.2063e-04\n",
"Epoch 49/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.5809e-05 - val_loss: 5.1318e-04\n",
"Epoch 50/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.7254e-05 - val_loss: 5.1308e-04\n",
"Epoch 51/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.5251e-05 - val_loss: 5.5543e-04\n",
"Epoch 52/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.5905e-05 - val_loss: 5.1017e-04\n",
"Epoch 53/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.5034e-05 - val_loss: 5.6716e-04\n",
"Epoch 54/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.5452e-05 - val_loss: 5.2440e-04\n",
"Epoch 55/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.7777e-05 - val_loss: 6.3141e-04\n",
"Epoch 56/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 5.1305e-05 - val_loss: 5.5474e-04\n",
"Epoch 57/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.7679e-05 - val_loss: 5.0443e-04\n",
"Epoch 58/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.5841e-05 - val_loss: 5.0486e-04\n",
"Epoch 59/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.4836e-05 - val_loss: 5.0822e-04\n",
"Epoch 60/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.4979e-05 - val_loss: 5.2020e-04\n",
"Epoch 61/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.4259e-05 - val_loss: 5.0977e-04\n",
"Epoch 62/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.4635e-05 - val_loss: 7.4517e-04\n",
"Epoch 63/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.9458e-05 - val_loss: 5.0636e-04\n",
"Epoch 64/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.9610e-05 - val_loss: 5.0729e-04\n",
"Epoch 65/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.8559e-05 - val_loss: 6.3253e-04\n",
"Epoch 66/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.7167e-05 - val_loss: 5.4755e-04\n",
"Epoch 67/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.7096e-05 - val_loss: 4.9066e-04\n",
"Epoch 68/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.4310e-05 - val_loss: 4.9044e-04\n",
"Epoch 69/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.4141e-05 - val_loss: 5.4068e-04\n",
"Epoch 70/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.9005e-05 - val_loss: 6.0567e-04\n",
"Epoch 71/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.9279e-05 - val_loss: 5.2227e-04\n",
"Epoch 72/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.7606e-05 - val_loss: 6.8591e-04\n",
"Epoch 73/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 5.4288e-05 - val_loss: 5.7212e-04\n",
"Epoch 74/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 5.2279e-05 - val_loss: 4.8281e-04\n",
"Epoch 75/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 5.0421e-05 - val_loss: 5.0018e-04\n",
"Epoch 76/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 5.0324e-05 - val_loss: 6.8538e-04\n",
"Epoch 77/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 5.7253e-05 - val_loss: 6.2901e-04\n",
"Epoch 78/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 5.2506e-05 - val_loss: 5.3627e-04\n",
"Epoch 79/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.8117e-05 - val_loss: 5.5424e-04\n",
"Epoch 80/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.5993e-05 - val_loss: 5.8062e-04\n",
"Epoch 81/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.8207e-05 - val_loss: 5.1133e-04\n",
"Epoch 82/300\n",
"6/6 [==============================] - 0s 37ms/step - loss: 4.9103e-05 - val_loss: 4.7516e-04\n",
"Epoch 83/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.9031e-05 - val_loss: 7.5069e-04\n",
"Epoch 84/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.7567e-05 - val_loss: 4.7432e-04\n",
"Epoch 85/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.3508e-05 - val_loss: 4.7671e-04\n",
"Epoch 86/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.3062e-05 - val_loss: 4.6603e-04\n",
"Epoch 87/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.3116e-05 - val_loss: 4.6714e-04\n",
"Epoch 88/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.3769e-05 - val_loss: 4.9306e-04\n",
"Epoch 89/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.3359e-05 - val_loss: 5.5865e-04\n",
"Epoch 90/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.3120e-05 - val_loss: 5.0523e-04\n",
"Epoch 91/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.3626e-05 - val_loss: 4.6584e-04\n",
"Epoch 92/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.3846e-05 - val_loss: 5.3466e-04\n",
"Epoch 93/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 5.0501e-05 - val_loss: 5.3762e-04\n",
"Epoch 94/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 5.2296e-05 - val_loss: 5.5350e-04\n",
"Epoch 95/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.9425e-05 - val_loss: 4.9249e-04\n",
"Epoch 96/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.7276e-05 - val_loss: 5.4912e-04\n",
"Epoch 97/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.1909e-05 - val_loss: 4.5487e-04\n",
"Epoch 98/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.2255e-05 - val_loss: 4.6518e-04\n",
"Epoch 99/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.3957e-05 - val_loss: 4.6023e-04\n",
"Epoch 100/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.2253e-05 - val_loss: 5.0644e-04\n",
"Epoch 101/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.0570e-05 - val_loss: 4.7234e-04\n",
"Epoch 102/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.0526e-05 - val_loss: 4.8120e-04\n",
"Epoch 103/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.0771e-05 - val_loss: 4.4871e-04\n",
"Epoch 104/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.1719e-05 - val_loss: 4.4550e-04\n",
"Epoch 105/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.2153e-05 - val_loss: 5.8857e-04\n",
"Epoch 106/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.3016e-05 - val_loss: 5.0342e-04\n",
"Epoch 107/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.7574e-05 - val_loss: 4.7303e-04\n",
"Epoch 108/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.3402e-05 - val_loss: 5.7601e-04\n",
"Epoch 109/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.5834e-05 - val_loss: 4.3906e-04\n",
"Epoch 110/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.5280e-05 - val_loss: 4.5233e-04\n",
"Epoch 111/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 4.0639e-05 - val_loss: 4.3581e-04\n",
"Epoch 112/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.1012e-05 - val_loss: 4.4967e-04\n",
"Epoch 113/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.1113e-05 - val_loss: 5.2586e-04\n",
"Epoch 114/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.0591e-05 - val_loss: 4.3176e-04\n",
"Epoch 115/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.0358e-05 - val_loss: 4.7936e-04\n",
"Epoch 116/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.9503e-05 - val_loss: 4.9555e-04\n",
"Epoch 117/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.9956e-05 - val_loss: 4.3167e-04\n",
"Epoch 118/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.9008e-05 - val_loss: 4.3674e-04\n",
"Epoch 119/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.9271e-05 - val_loss: 5.8607e-04\n",
"Epoch 120/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 5.1134e-05 - val_loss: 4.3971e-04\n",
"Epoch 121/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 5.1691e-05 - val_loss: 4.6761e-04\n",
"Epoch 122/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.8591e-05 - val_loss: 5.3190e-04\n",
"Epoch 123/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.1040e-05 - val_loss: 4.2018e-04\n",
"Epoch 124/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.9335e-05 - val_loss: 4.8495e-04\n",
"Epoch 125/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.1402e-05 - val_loss: 4.5981e-04\n",
"Epoch 126/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.1858e-05 - val_loss: 5.0781e-04\n",
"Epoch 127/300\n",
"6/6 [==============================] - 0s 38ms/step - loss: 3.8837e-05 - val_loss: 4.3776e-04\n",
"Epoch 128/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.0212e-05 - val_loss: 4.1703e-04\n",
"Epoch 129/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.2124e-05 - val_loss: 5.8645e-04\n",
"Epoch 130/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.6044e-05 - val_loss: 4.1222e-04\n",
"Epoch 131/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.2733e-05 - val_loss: 4.2163e-04\n",
"Epoch 132/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.9469e-05 - val_loss: 4.2418e-04\n",
"Epoch 133/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.7501e-05 - val_loss: 4.3677e-04\n",
"Epoch 134/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.8176e-05 - val_loss: 4.2952e-04\n",
"Epoch 135/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.0369e-05 - val_loss: 6.6701e-04\n",
"Epoch 136/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.9337e-05 - val_loss: 4.0733e-04\n",
"Epoch 137/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.3170e-05 - val_loss: 4.0414e-04\n",
"Epoch 138/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.1523e-05 - val_loss: 5.1315e-04\n",
"Epoch 139/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.0638e-05 - val_loss: 4.1847e-04\n",
"Epoch 140/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.0677e-05 - val_loss: 4.3206e-04\n",
"Epoch 141/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.0680e-05 - val_loss: 5.6356e-04\n",
"Epoch 142/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.2306e-05 - val_loss: 4.1415e-04\n",
"Epoch 143/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.0676e-05 - val_loss: 3.9718e-04\n",
"Epoch 144/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.7425e-05 - val_loss: 4.8362e-04\n",
"Epoch 145/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.0463e-05 - val_loss: 4.2217e-04\n",
"Epoch 146/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.6883e-05 - val_loss: 3.9380e-04\n",
"Epoch 147/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.6913e-05 - val_loss: 3.9412e-04\n",
"Epoch 148/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.0054e-05 - val_loss: 4.6880e-04\n",
"Epoch 149/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.7090e-05 - val_loss: 3.9191e-04\n",
"Epoch 150/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.7152e-05 - val_loss: 3.9188e-04\n",
"Epoch 151/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.5870e-05 - val_loss: 4.0480e-04\n",
"Epoch 152/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.6648e-05 - val_loss: 3.9267e-04\n",
"Epoch 153/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 3.7164e-05 - val_loss: 5.5292e-04\n",
"Epoch 154/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.0360e-05 - val_loss: 3.8849e-04\n",
"Epoch 155/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.8028e-05 - val_loss: 4.0467e-04\n",
"Epoch 156/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.8752e-05 - val_loss: 4.3394e-04\n",
"Epoch 157/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.6166e-05 - val_loss: 4.1157e-04\n",
"Epoch 158/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.7406e-05 - val_loss: 3.9664e-04\n",
"Epoch 159/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.5835e-05 - val_loss: 4.7533e-04\n",
"Epoch 160/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.7883e-05 - val_loss: 3.7862e-04\n",
"Epoch 161/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.7002e-05 - val_loss: 4.1774e-04\n",
"Epoch 162/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.0066e-05 - val_loss: 3.9038e-04\n",
"Epoch 163/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.7831e-05 - val_loss: 3.7863e-04\n",
"Epoch 164/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.6573e-05 - val_loss: 3.8238e-04\n",
"Epoch 165/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.7520e-05 - val_loss: 3.7538e-04\n",
"Epoch 166/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.5161e-05 - val_loss: 4.0763e-04\n",
"Epoch 167/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.7949e-05 - val_loss: 3.7453e-04\n",
"Epoch 168/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.5391e-05 - val_loss: 3.7064e-04\n",
"Epoch 169/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.7920e-05 - val_loss: 3.6871e-04\n",
"Epoch 170/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.6607e-05 - val_loss: 4.5369e-04\n",
"Epoch 171/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.6203e-05 - val_loss: 3.6751e-04\n",
"Epoch 172/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.5052e-05 - val_loss: 4.9162e-04\n",
"Epoch 173/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.7034e-05 - val_loss: 3.8094e-04\n",
"Epoch 174/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.6693e-05 - val_loss: 4.2844e-04\n",
"Epoch 175/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.6451e-05 - val_loss: 3.9608e-04\n",
"Epoch 176/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.4949e-05 - val_loss: 3.6128e-04\n",
"Epoch 177/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.4564e-05 - val_loss: 3.7150e-04\n",
"Epoch 178/300\n",
"6/6 [==============================] - 0s 37ms/step - loss: 3.5198e-05 - val_loss: 3.7639e-04\n",
"Epoch 179/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.6648e-05 - val_loss: 3.8561e-04\n",
"Epoch 180/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.7191e-05 - val_loss: 4.2380e-04\n",
"Epoch 181/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.8103e-05 - val_loss: 3.6462e-04\n",
"Epoch 182/300\n",
"6/6 [==============================] - 0s 30ms/step - loss: 3.5416e-05 - val_loss: 6.5856e-04\n",
"Epoch 183/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.5402e-05 - val_loss: 3.8154e-04\n",
"Epoch 184/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.5820e-05 - val_loss: 6.0560e-04\n",
"Epoch 185/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.0189e-05 - val_loss: 4.0743e-04\n",
"Epoch 186/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.9509e-05 - val_loss: 3.7497e-04\n",
"Epoch 187/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.7833e-05 - val_loss: 3.7615e-04\n",
"Epoch 188/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.5893e-05 - val_loss: 3.5360e-04\n",
"Epoch 189/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.5397e-05 - val_loss: 3.4571e-04\n",
"Epoch 190/300\n",
"6/6 [==============================] - 0s 31ms/step - loss: 3.4754e-05 - val_loss: 3.7442e-04\n",
"Epoch 191/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.3364e-05 - val_loss: 3.7269e-04\n",
"Epoch 192/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.3811e-05 - val_loss: 3.9378e-04\n",
"Epoch 193/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.5349e-05 - val_loss: 3.4427e-04\n",
"Epoch 194/300\n",
"6/6 [==============================] - 0s 30ms/step - loss: 3.8081e-05 - val_loss: 4.5326e-04\n",
"Epoch 195/300\n",
"6/6 [==============================] - 0s 31ms/step - loss: 3.5818e-05 - val_loss: 3.8512e-04\n",
"Epoch 196/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 3.6307e-05 - val_loss: 3.8736e-04\n",
"Epoch 197/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.4238e-05 - val_loss: 3.4454e-04\n",
"Epoch 198/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.4051e-05 - val_loss: 3.4162e-04\n",
"Epoch 199/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.5975e-05 - val_loss: 3.7907e-04\n",
"Epoch 200/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.4723e-05 - val_loss: 3.5411e-04\n",
"Epoch 201/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.5441e-05 - val_loss: 3.4065e-04\n",
"Epoch 202/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.2994e-05 - val_loss: 3.3443e-04\n",
"Epoch 203/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 3.2386e-05 - val_loss: 3.3433e-04\n",
"Epoch 204/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 3.2532e-05 - val_loss: 4.9409e-04\n",
"Epoch 205/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.6390e-05 - val_loss: 3.5703e-04\n",
"Epoch 206/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.7373e-05 - val_loss: 3.7756e-04\n",
"Epoch 207/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.8520e-05 - val_loss: 3.7989e-04\n",
"Epoch 208/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.7669e-05 - val_loss: 3.5140e-04\n",
"Epoch 209/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.4343e-05 - val_loss: 4.0296e-04\n",
"Epoch 210/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.4826e-05 - val_loss: 3.3830e-04\n",
"Epoch 211/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.4411e-05 - val_loss: 3.2794e-04\n",
"Epoch 212/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.3735e-05 - val_loss: 3.2816e-04\n",
"Epoch 213/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.2009e-05 - val_loss: 3.8783e-04\n",
"Epoch 214/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.2901e-05 - val_loss: 3.4561e-04\n",
"Epoch 215/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.2039e-05 - val_loss: 3.2541e-04\n",
"Epoch 216/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1737e-05 - val_loss: 3.3265e-04\n",
"Epoch 217/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1533e-05 - val_loss: 3.2900e-04\n",
"Epoch 218/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.1495e-05 - val_loss: 3.7068e-04\n",
"Epoch 219/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1388e-05 - val_loss: 3.3259e-04\n",
"Epoch 220/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1156e-05 - val_loss: 4.0736e-04\n",
"Epoch 221/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1986e-05 - val_loss: 3.2558e-04\n",
"Epoch 222/300\n",
"6/6 [==============================] - 0s 35ms/step - loss: 3.2770e-05 - val_loss: 4.9332e-04\n",
"Epoch 223/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.5997e-05 - val_loss: 3.2944e-04\n",
"Epoch 224/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.3435e-05 - val_loss: 4.8294e-04\n",
"Epoch 225/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.4517e-05 - val_loss: 3.3350e-04\n",
"Epoch 226/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1024e-05 - val_loss: 3.2739e-04\n",
"Epoch 227/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.0829e-05 - val_loss: 3.1635e-04\n",
"Epoch 228/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.1500e-05 - val_loss: 3.6727e-04\n",
"Epoch 229/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1012e-05 - val_loss: 3.1509e-04\n",
"Epoch 230/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.0797e-05 - val_loss: 3.9436e-04\n",
"Epoch 231/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.1639e-05 - val_loss: 3.3696e-04\n",
"Epoch 232/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.0828e-05 - val_loss: 3.5289e-04\n",
"Epoch 233/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1682e-05 - val_loss: 3.9576e-04\n",
"Epoch 234/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.4716e-05 - val_loss: 3.7956e-04\n",
"Epoch 235/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.9644e-05 - val_loss: 5.6274e-04\n",
"Epoch 236/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.5305e-05 - val_loss: 3.1149e-04\n",
"Epoch 237/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.1806e-05 - val_loss: 3.6977e-04\n",
"Epoch 238/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 3.2046e-05 - val_loss: 3.1771e-04\n",
"Epoch 239/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.1964e-05 - val_loss: 3.1637e-04\n",
"Epoch 240/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.0958e-05 - val_loss: 3.5127e-04\n",
"Epoch 241/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.2261e-05 - val_loss: 3.0755e-04\n",
"Epoch 242/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.4718e-05 - val_loss: 4.4235e-04\n",
"Epoch 243/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.4675e-05 - val_loss: 3.1811e-04\n",
"Epoch 244/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.3075e-05 - val_loss: 3.8481e-04\n",
"Epoch 245/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.0910e-05 - val_loss: 3.2136e-04\n",
"Epoch 246/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.3528e-05 - val_loss: 4.6475e-04\n",
"Epoch 247/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.6748e-05 - val_loss: 3.0626e-04\n",
"Epoch 248/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 3.2193e-05 - val_loss: 3.0778e-04\n",
"Epoch 249/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.0542e-05 - val_loss: 3.7856e-04\n",
"Epoch 250/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.1912e-05 - val_loss: 3.0847e-04\n",
"Epoch 251/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.5287e-05 - val_loss: 3.2022e-04\n",
"Epoch 252/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1589e-05 - val_loss: 3.1819e-04\n",
"Epoch 253/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 2.9823e-05 - val_loss: 3.0381e-04\n",
"Epoch 254/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.0014e-05 - val_loss: 3.6404e-04\n",
"Epoch 255/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.2922e-05 - val_loss: 3.0589e-04\n",
"Epoch 256/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 2.9711e-05 - val_loss: 4.4349e-04\n",
"Epoch 257/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.3159e-05 - val_loss: 3.6379e-04\n",
"Epoch 258/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.3526e-05 - val_loss: 3.0306e-04\n",
"Epoch 259/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.0376e-05 - val_loss: 3.5862e-04\n",
"Epoch 260/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 2.9825e-05 - val_loss: 3.1904e-04\n",
"Epoch 261/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1879e-05 - val_loss: 3.4188e-04\n",
"Epoch 262/300\n",
"6/6 [==============================] - 0s 37ms/step - loss: 3.3935e-05 - val_loss: 3.5108e-04\n",
"Epoch 263/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.0101e-05 - val_loss: 3.0878e-04\n",
"Epoch 264/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 2.9251e-05 - val_loss: 2.9988e-04\n",
"Epoch 265/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 2.9135e-05 - val_loss: 3.1429e-04\n",
"Epoch 266/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1148e-05 - val_loss: 3.2367e-04\n",
"Epoch 267/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.0476e-05 - val_loss: 2.9820e-04\n",
"Epoch 268/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 2.9238e-05 - val_loss: 3.2258e-04\n",
"Epoch 269/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 2.9202e-05 - val_loss: 2.9815e-04\n",
"Epoch 270/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1455e-05 - val_loss: 3.2140e-04\n",
"Epoch 271/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 2.9394e-05 - val_loss: 3.6962e-04\n",
"Epoch 272/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.0026e-05 - val_loss: 3.0022e-04\n",
"Epoch 273/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.0705e-05 - val_loss: 4.9474e-04\n",
"Epoch 274/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.4969e-05 - val_loss: 3.0065e-04\n",
"Epoch 275/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1780e-05 - val_loss: 3.2616e-04\n",
"Epoch 276/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.0128e-05 - val_loss: 3.0402e-04\n",
"Epoch 277/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.4030e-05 - val_loss: 6.9602e-04\n",
"Epoch 278/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 4.2202e-05 - val_loss: 3.0068e-04\n",
"Epoch 279/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.0910e-05 - val_loss: 3.0203e-04\n",
"Epoch 280/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.0341e-05 - val_loss: 3.4467e-04\n",
"Epoch 281/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.5805e-05 - val_loss: 2.9584e-04\n",
"Epoch 282/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1648e-05 - val_loss: 3.5150e-04\n",
"Epoch 283/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.4300e-05 - val_loss: 3.0483e-04\n",
"Epoch 284/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 2.8822e-05 - val_loss: 3.5656e-04\n",
"Epoch 285/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.6199e-05 - val_loss: 6.8535e-04\n",
"Epoch 286/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 4.1642e-05 - val_loss: 3.7541e-04\n",
"Epoch 287/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.8214e-05 - val_loss: 4.0116e-04\n",
"Epoch 288/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.2742e-05 - val_loss: 2.9232e-04\n",
"Epoch 289/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 2.9566e-05 - val_loss: 3.0349e-04\n",
"Epoch 290/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 2.8411e-05 - val_loss: 3.5827e-04\n",
"Epoch 291/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 2.9510e-05 - val_loss: 3.1645e-04\n",
"Epoch 292/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 3.2016e-05 - val_loss: 4.0342e-04\n",
"Epoch 293/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.0703e-05 - val_loss: 2.9043e-04\n",
"Epoch 294/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.1408e-05 - val_loss: 2.9512e-04\n",
"Epoch 295/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 2.8574e-05 - val_loss: 3.0567e-04\n",
"Epoch 296/300\n",
"6/6 [==============================] - 0s 35ms/step - loss: 2.8477e-05 - val_loss: 3.2119e-04\n",
"Epoch 297/300\n",
"6/6 [==============================] - 0s 29ms/step - loss: 2.9123e-05 - val_loss: 3.8052e-04\n",
"Epoch 298/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 3.2265e-05 - val_loss: 3.0611e-04\n",
"Epoch 299/300\n",
"6/6 [==============================] - 0s 27ms/step - loss: 2.9846e-05 - val_loss: 3.6055e-04\n",
"Epoch 300/300\n",
"6/6 [==============================] - 0s 28ms/step - loss: 2.9634e-05 - val_loss: 2.9422e-04\n"
]
}
],
"source": [
"# Fit model 1 and keep the returned History object for the loss plot below.\n",
"# NOTE(review): the test split is also passed as validation data, so val_loss\n",
"# is not an independent hold-out estimate -- confirm this is intended.\n",
"epochs = 300\n",
"history1 = model1.fit(\n",
"    x_train1,\n",
"    y_train1,\n",
"    batch_size=512,\n",
"    epochs=epochs,\n",
"    validation_data=(x_test1, y_test1),\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 34,
"id": "dd1998bc-5ad2-4db7-83f0-156b52b79d78",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "",
"text/plain": [
""
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Plot the loss curve for the model 1 training run.\n",
"plotLossCurve(\n",
"    history1,\n",
"    \"red\",\n",
"    \"Model 1 Loss\",\n",
")"
]
},
{
"cell_type": "markdown",
"id": "55fc1c73-7b1d-46a0-8d90-112328196d23",
"metadata": {},
"source": [
"#### Hmm... my loss is still pretty high (the validation loss is roughly 10x the training loss). Maybe I'll try it with more epochs later."
]
},
{
"cell_type": "code",
"execution_count": 35,
"id": "7559641e-9e23-4877-b153-d9b169467ddc",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"22/22 [==============================] - 1s 18ms/step\n",
"Median Absolute Error (MAE): 1.79\n",
"Mean Absolute Percentage Error (MAPE): 1.55 %\n",
"Median Absolute Percentage Error (MDAPE): 1.12 %\n"
]
}
],
"source": [
"# Evaluate model 1 on the test split.\n",
"# Note: `eval` here is a user-defined helper, not the Python builtin it shadows.\n",
"(MAE1, MAPE1, MDAPE1, y_pred1) = eval(\n",
"    model1, x_test1, y_test1, scaler_pred1\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 36,
"id": "0ac5630b-239f-4c36-9789-f2463a772a16",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "",
"text/plain": [
""
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Plot the model 1 predictions.\n",
"visualizePreds(\n",
"    data_filtered1,\n",
"    train_data_len1,\n",
"    y_pred1,\n",
"    date_index1,\n",
"    \"orange\",\n",
")"
]
},
{
"cell_type": "markdown",
"id": "da42add1-1f67-43d3-9e7c-9d0dc2e7b495",
"metadata": {},
"source": [
"#### TODO: Where is my train data in the plot above? Fix this later.\n",
"\n",
"### Predict tomorrow's price"
]
},
{
"cell_type": "code",
"execution_count": 37,
"id": "8becd22c-a2a2-4e81-ae80-43bd98c1a60e",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"1/1 [==============================] - 0s 28ms/step\n",
"The close price for GOOG at 2023-10-19 was 139.28\n",
"The predicted close price is 140.5500030517578 (+0.9%)\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"/tmp/ipykernel_15950/3096130203.py:16: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
" price_today = np.round(new_df['Close'][-1], 2)\n"
]
}
],
"source": [
"# Forecast the next close price with model 1.\n",
"predictFuturePrice(\n",
"    model1,\n",
"    df,\n",
"    sequence_length1,\n",
"    features1,\n",
"    scaler1,\n",
"    scaler_pred1,\n",
")"
]
},
{
"cell_type": "markdown",
"id": "9f3d7414-56b0-4063-92a7-401dc622bd8c",
"metadata": {},
"source": [
"### The model predicts the next close +0.9% above the last close (that is the forecast move, not a measured error)\n",
"### Now let's add Sentiment Analysis"
]
},
{
"cell_type": "markdown",
"id": "7f445d28-9f12-4347-a4ca-8510b883aaa9",
"metadata": {},
"source": [
"## BERT Sentiment Analysis\n",
"\n",
"##### Going to use tweet data"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "463ece8c-b7e5-471f-9af6-727a1338f89f",
"metadata": {},
"outputs": [],
"source": [
"import os\n",
"import csv\n",
"import json\n",
"import datetime\n",
"import pandas as pd\n",
"from tqdm import tqdm\n",
"import snscrape.modules.twitter as sntwitter\n",
"\n",
"path = \"./GOOG_tweets.json\"\n",
"\n",
"# Scrape up to `maxTweets` tweets per calendar day and cache them in a JSON file\n",
"# keyed by day (dd/mm/YYYY). Delete that file to force a fresh scrape.\n",
"# Requires stockname, date_start and date_today from earlier cells.\n",
"tweets_file = stockname + '_tweets.json'\n",
"\n",
"if os.path.isfile(tweets_file):\n",
"    print(\"File already exists...no need to scrape it again\")\n",
"    print(\"To scrape again, delete : \" + tweets_file)\n",
"else:\n",
"    maxTweets = 3\n",
"    start_date = date_start.date()\n",
"    period = (date_today - start_date).days\n",
"\n",
"    tweets = dict()\n",
"    for day_offset in tqdm(range(period)):\n",
"        # Derive the day from the offset so a failed day is skipped instead of\n",
"        # being retried on the next iteration and cutting the range short.\n",
"        start_interval = start_date + datetime.timedelta(days=day_offset)\n",
"        end_interval = start_interval + datetime.timedelta(days=1)\n",
"        # NOTE: the search terms are hard-coded for GOOG; update them if\n",
"        # stockname changes.\n",
"        query = ('#Google + OR @Google + since:' + str(start_interval)\n",
"                 + ' until:' + str(end_interval)\n",
"                 + ' -filter:links -filter:replies lang:\"en\" ')\n",
"        try:\n",
"            dayTweets = list()\n",
"            for tweet in sntwitter.TwitterSearchScraper(query).get_items():\n",
"                # Stop once exactly maxTweets tweets have been kept.\n",
"                if len(dayTweets) >= maxTweets:\n",
"                    break\n",
"                dayTweets.append(tweet.content)\n",
"        except Exception as e:\n",
"            # Best effort: report the failing day and move on to the next one.\n",
"            print(start_interval, e)\n",
"            continue\n",
"        tweets[start_interval.strftime('%d/%m/%Y')] = dayTweets\n",
"\n",
"    with open(tweets_file, 'w') as fp:\n",
"        json.dump(tweets, fp)"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "72ccf9fe-9fac-475a-8eb8-a42f63e14150",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" Open | \n",
" High | \n",
" Low | \n",
" Close | \n",
" Adj Close | \n",
" Volume | \n",
" Unnamed: 0 | \n",
" NEG | \n",
" NEU | \n",
" POS | \n",
"
\n",
" \n",
" Date | \n",
" | \n",
" | \n",
" | \n",
" | \n",
" | \n",
" | \n",
" | \n",
" | \n",
" | \n",
" | \n",
"
\n",
" \n",
" \n",
" \n",
"
\n",
"
"
],
"text/plain": [
"Empty DataFrame\n",
"Columns: [Open, High, Low, Close, Adj Close, Volume, Unnamed: 0, NEG, NEU, POS]\n",
"Index: []"
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Load the per-day sentiment scores and align them with the price data.\n",
"# Dates are parsed into timestamps while reading: a string index never matches\n",
"# a date index, which is presumably why this join used to come back empty\n",
"# -- TODO confirm that df is indexed by (timezone-naive) dates.\n",
"df_senti = pd.read_csv('GOOG_senti_scores.csv', parse_dates=['Date'], index_col='Date')\n",
"# 'Unnamed: 0' is presumably a leftover row index written into the CSV; it is\n",
"# not a sentiment feature, so drop it when present.\n",
"df_senti = df_senti.drop(columns=['Unnamed: 0'], errors='ignore')\n",
"df2 = df.join(df_senti, how='inner')\n",
"if df2.empty:\n",
"    print('Warning: df and df_senti share no dates; check the index types and timezones')\n",
"df2.head()"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "d0948923-b6eb-41d0-8618-1ac9f9a586f4",
"metadata": {},
"outputs": [],
"source": [
"import json\n",
"# Import the class under an alias: the scraping cells run `import datetime`,\n",
"# which rebinds the bare name `datetime` to the module (no `strptime` there).\n",
"from datetime import datetime as dt\n",
"\n",
"# Average the sentiment scores of each day's cached tweets.\n",
"# Requires stockname, tqdm, preprocess, tokenizer, model and softmax to be\n",
"# defined by other cells before this one runs.\n",
"with open(stockname + '_tweets.json') as f:\n",
"    data = json.load(f)\n",
"\n",
"dates = list()\n",
"NEG = list()\n",
"NEU = list()\n",
"POS = list()\n",
"\n",
"for key in tqdm(data):\n",
"    reviews = data[key]\n",
"    if not reviews:\n",
"        # No tweets were cached for this day; skip it rather than divide by zero.\n",
"        continue\n",
"    neg = 0\n",
"    neu = 0\n",
"    pos = 0\n",
"    for text in reviews:\n",
"        text = preprocess(text)\n",
"        encoded_input = tokenizer(text, return_tensors='pt')\n",
"        output = model(**encoded_input)\n",
"        scores = softmax(output[0][0].detach().numpy())\n",
"        # Assumes the model's label order is negative, neutral, positive\n",
"        # -- TODO confirm against the model config.\n",
"        neg += scores[0]\n",
"        neu += scores[1]\n",
"        pos += scores[2]\n",
"\n",
"    cnt = len(reviews)\n",
"    NEG.append(neg / cnt)\n",
"    NEU.append(neu / cnt)\n",
"    POS.append(pos / cnt)\n",
"    dates.append(dt.strptime(str(key), \"%d/%m/%Y\"))"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "5d07d84b-cd46-49e3-a5b8-46a2aa832a4b",
"metadata": {},
"outputs": [],
"source": [
"\n",
"import csv\n",
"# NOTE: this rebinds the bare name `datetime` to the module; the notebook's\n",
"# first cell imports the `datetime` class under the same name.\n",
"import datetime\n",
"import json\n",
"import os\n",
"\n",
"import pandas as pd\n",
"from tqdm import tqdm\n",
"import snscrape.modules.twitter as sntwitter\n",
"\n",
"# NOTE(review): this cell repeats the tweet-scraping cell earlier in the\n",
"# notebook; consider keeping only one of them.\n",
"# Scrape up to `maxTweets` tweets per calendar day and cache them in a JSON file\n",
"# keyed by day (dd/mm/YYYY). Delete that file to force a fresh scrape.\n",
"# Requires stockname, date_start and date_today from earlier cells.\n",
"tweets_file = stockname + '_tweets.json'\n",
"\n",
"if os.path.isfile(tweets_file):\n",
"    print(\"File already exists...no need to scrape it again\")\n",
"    print(\"To scrape again, delete : \" + tweets_file)\n",
"else:\n",
"    maxTweets = 3\n",
"    start_date = date_start.date()\n",
"    period = (date_today - start_date).days\n",
"\n",
"    tweets = dict()\n",
"    for day_offset in tqdm(range(period)):\n",
"        # Derive the day from the offset so a failed day is skipped instead of\n",
"        # being retried on the next iteration and cutting the range short.\n",
"        start_interval = start_date + datetime.timedelta(days=day_offset)\n",
"        end_interval = start_interval + datetime.timedelta(days=1)\n",
"        query = ('#Google + OR @Google + since:' + str(start_interval)\n",
"                 + ' until:' + str(end_interval)\n",
"                 + ' -filter:links -filter:replies lang:\"en\" ')\n",
"        try:\n",
"            dayTweets = list()\n",
"            for tweet in sntwitter.TwitterSearchScraper(query).get_items():\n",
"                # Stop once exactly maxTweets tweets have been kept.\n",
"                if len(dayTweets) >= maxTweets:\n",
"                    break\n",
"                dayTweets.append(tweet.content)\n",
"        except Exception as e:\n",
"            # Best effort: report the failing day and move on to the next one.\n",
"            print(start_interval, e)\n",
"            continue\n",
"        tweets[start_interval.strftime('%d/%m/%Y')] = dayTweets\n",
"\n",
"    with open(tweets_file, 'w') as fp:\n",
"        json.dump(tweets, fp)"
]
},
{
"cell_type": "code",
"execution_count": 40,
"id": "a2400087-ba13-4822-8805-32d0a1e117d3",
"metadata": {},
"outputs": [],
"source": [
"import os, csv\n",
"import urllib.request\n",
"from scipy.special import softmax\n",
"from transformers import AutoModelForSequenceClassification\n",
"from transformers import TFAutoModelForSequenceClassification\n",
"from transformers import AutoTokenizer"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "f144ad58-e91b-41f7-aa32-378de57704e3",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.12"
},
"widgets": {
"application/vnd.jupyter.widget-state+json": {
"state": {},
"version_major": 2,
"version_minor": 0
}
}
},
"nbformat": 4,
"nbformat_minor": 5
}