{
"cells": [
{
"cell_type": "markdown",
"id": "db9bc293",
"metadata": {},
"source": [
"## Name : ADVAIT GURUNATH CHAVAN\n",
"## Contact Number : +91 70214 55852\n",
"## Mail ID : advaitchavan135@gmail.com \n",
"\n",
"## Oasis Infobyte Data Science Intern\n",
"\n",
"## Task 5 : Sales Prediction using Python"
]
},
{
"cell_type": "markdown",
"id": "cb2c0a17",
"metadata": {},
"source": [
"
"
]
},
{
"cell_type": "markdown",
"id": "d8e860ae",
"metadata": {},
"source": [
"## 1. Importing the necessary dependencies"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "f9a33522",
"metadata": {},
"outputs": [],
"source": [
"import pandas as pd\n",
"import matplotlib.pyplot as plt\n",
"import numpy as np\n",
"import seaborn as sns\n",
"import plotly.io as plio\n",
"plio.templates\n",
"import plotly.express as px\n",
"import plotly.graph_objects as go\n",
"from sklearn.model_selection import train_test_split\n",
"\n",
"from sklearn.metrics import mean_squared_error, r2_score\n",
"\n",
"from sklearn.linear_model import LinearRegression, Ridge, Lasso, ElasticNet\n",
"from sklearn.ensemble import RandomForestRegressor, GradientBoostingRegressor\n",
"\n",
"from xgboost import XGBRegressor\n",
"\n",
"import joblib\n",
"\n",
"from warnings import filterwarnings\n",
"filterwarnings(action='ignore')"
]
},
{
"cell_type": "markdown",
"id": "7d9d5f85",
"metadata": {},
"source": [
"## 2. Exploring the dataset"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "6b16f8c6",
"metadata": {},
"outputs": [],
"source": [
"data = pd.read_csv('advertising.csv')"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "95c0b763",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"
| \n", " | Unnamed: 0 | \n", "TV | \n", "Radio | \n", "Newspaper | \n", "Sales | \n", "
|---|---|---|---|---|---|
| 0 | \n", "1 | \n", "230.1 | \n", "37.8 | \n", "69.2 | \n", "22.1 | \n", "
| 1 | \n", "2 | \n", "44.5 | \n", "39.3 | \n", "45.1 | \n", "10.4 | \n", "
| 2 | \n", "3 | \n", "17.2 | \n", "45.9 | \n", "69.3 | \n", "9.3 | \n", "
| 3 | \n", "4 | \n", "151.5 | \n", "41.3 | \n", "58.5 | \n", "18.5 | \n", "
| 4 | \n", "5 | \n", "180.8 | \n", "10.8 | \n", "58.4 | \n", "12.9 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 195 | \n", "196 | \n", "38.2 | \n", "3.7 | \n", "13.8 | \n", "7.6 | \n", "
| 196 | \n", "197 | \n", "94.2 | \n", "4.9 | \n", "8.1 | \n", "9.7 | \n", "
| 197 | \n", "198 | \n", "177.0 | \n", "9.3 | \n", "6.4 | \n", "12.8 | \n", "
| 198 | \n", "199 | \n", "283.6 | \n", "42.0 | \n", "66.2 | \n", "25.5 | \n", "
| 199 | \n", "200 | \n", "232.1 | \n", "8.6 | \n", "8.7 | \n", "13.4 | \n", "
200 rows × 5 columns
\n", "| \n", " | TV | \n", "Radio | \n", "Newspaper | \n", "Sales | \n", "
|---|---|---|---|---|
| 0 | \n", "230.1 | \n", "37.8 | \n", "69.2 | \n", "22.1 | \n", "
| 1 | \n", "44.5 | \n", "39.3 | \n", "45.1 | \n", "10.4 | \n", "
| 2 | \n", "17.2 | \n", "45.9 | \n", "69.3 | \n", "9.3 | \n", "
| 3 | \n", "151.5 | \n", "41.3 | \n", "58.5 | \n", "18.5 | \n", "
| 4 | \n", "180.8 | \n", "10.8 | \n", "58.4 | \n", "12.9 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 195 | \n", "38.2 | \n", "3.7 | \n", "13.8 | \n", "7.6 | \n", "
| 196 | \n", "94.2 | \n", "4.9 | \n", "8.1 | \n", "9.7 | \n", "
| 197 | \n", "177.0 | \n", "9.3 | \n", "6.4 | \n", "12.8 | \n", "
| 198 | \n", "283.6 | \n", "42.0 | \n", "66.2 | \n", "25.5 | \n", "
| 199 | \n", "232.1 | \n", "8.6 | \n", "8.7 | \n", "13.4 | \n", "
200 rows × 4 columns
\n", "| \n", " | TV | \n", "Radio | \n", "Newspaper | \n", "Sales | \n", "
|---|---|---|---|---|
| count | \n", "200.000000 | \n", "200.000000 | \n", "200.000000 | \n", "200.000000 | \n", "
| mean | \n", "147.042500 | \n", "23.264000 | \n", "30.554000 | \n", "14.022500 | \n", "
| std | \n", "85.854236 | \n", "14.846809 | \n", "21.778621 | \n", "5.217457 | \n", "
| min | \n", "0.700000 | \n", "0.000000 | \n", "0.300000 | \n", "1.600000 | \n", "
| 25% | \n", "74.375000 | \n", "9.975000 | \n", "12.750000 | \n", "10.375000 | \n", "
| 50% | \n", "149.750000 | \n", "22.900000 | \n", "25.750000 | \n", "12.900000 | \n", "
| 75% | \n", "218.825000 | \n", "36.525000 | \n", "45.100000 | \n", "17.400000 | \n", "
| max | \n", "296.400000 | \n", "49.600000 | \n", "114.000000 | \n", "27.000000 | \n", "
| \n", " | TV | \n", "Radio | \n", "Newspaper | \n", "
|---|---|---|---|
| 0 | \n", "230.1 | \n", "37.8 | \n", "69.2 | \n", "
| 1 | \n", "44.5 | \n", "39.3 | \n", "45.1 | \n", "
| 2 | \n", "17.2 | \n", "45.9 | \n", "69.3 | \n", "
| 3 | \n", "151.5 | \n", "41.3 | \n", "58.5 | \n", "
| 4 | \n", "180.8 | \n", "10.8 | \n", "58.4 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "
| 195 | \n", "38.2 | \n", "3.7 | \n", "13.8 | \n", "
| 196 | \n", "94.2 | \n", "4.9 | \n", "8.1 | \n", "
| 197 | \n", "177.0 | \n", "9.3 | \n", "6.4 | \n", "
| 198 | \n", "283.6 | \n", "42.0 | \n", "66.2 | \n", "
| 199 | \n", "232.1 | \n", "8.6 | \n", "8.7 | \n", "
200 rows × 3 columns
\n", "| \n", " | Sales | \n", "
|---|---|
| 0 | \n", "22.1 | \n", "
| 1 | \n", "10.4 | \n", "
| 2 | \n", "9.3 | \n", "
| 3 | \n", "18.5 | \n", "
| 4 | \n", "12.9 | \n", "
| ... | \n", "... | \n", "
| 195 | \n", "7.6 | \n", "
| 196 | \n", "9.7 | \n", "
| 197 | \n", "12.8 | \n", "
| 198 | \n", "25.5 | \n", "
| 199 | \n", "13.4 | \n", "
200 rows × 1 columns
\n", "