{ "cells": [ { "cell_type": "markdown", "id": "3e29cbdb-a52a-40d0-8b56-eeba5fc2f9ec", "metadata": { "canvas": { "comments": [], "componentType": "CodeCell", "copiedOriginId": null, "diskcache": false, "headerColor": "inherit", "id": "73ec4c5e-654b-4690-8e78-4741d28639c3", "isComponent": false, "name": "", "parents": [] }, "tags": [] }, "source": [ "# Iris Data Classification\n", "- Link Component Color Annotations\n", " - Yellow : data load / preprocessing\n", " - Green : EDA\n", " - Violet : model train / predict" ] }, { "cell_type": "markdown", "id": "1f1812ad-d273-4a63-81c6-0485854902fd", "metadata": { "canvas": { "comments": [], "componentType": "CodeCell", "copiedOriginId": null, "diskcache": false, "headerColor": "inherit", "id": "412fd885-1b58-43cc-9b49-579287bc041d", "isComponent": false, "name": "", "parents": [] }, "tags": [] }, "source": [ "### Required Python Packages\n", "- `numpy`\n", "- `pandas`\n", "- `scikit-learn`\n", "- `seaborn`\n", "- `matplotlib`\n", "\n", "Run the following cell to install the packages." ] }, { "cell_type": "code", "execution_count": null, "id": "8867b11a-5d5b-4346-9848-a939e2e4adce", "metadata": { "canvas": { "comments": [], "componentType": "CodeCell", "copiedOriginId": null, "diskcache": false, "headerColor": "inherit", "id": "4022f772-1eec-4bbe-877e-ef196827fb32", "isComponent": false, "name": "", "parents": [] } }, "outputs": [], "source": [ "#\n", "# Required Packages\n", "# Run this cell to install required packages.\n", "#\n", "%pip install \"matplotlib>=2.0\" \"numpy>=1.19\" \"pandas>=1.1\" \"scikit-learn>=0.22.2\" \"seaborn>=0.11\"" ] }, { "cell_type": "markdown", "id": "2fb89b64-10ef-40f2-87cd-49fb42b82952", "metadata": { "canvas": { "comments": [], "componentType": "CodeCell", "copiedOriginId": null, "diskcache": false, "headerColor": "inherit", "id": "bf338eaf-cf47-4680-bc99-9cf3bd0fa5fd", "isComponent": false, "name": "", "parents": [] } }, "source": [ "### 0. 
Global Parameters\n", "- Global parameters of the link pipeline\n", " - test_size : fraction of the data held out as the validation set in the train/validation split\n", " - random_state : seed for the random number generator (for reproducible results)" ] }, { "cell_type": "markdown", "id": "d4c974d6-679e-4854-95b1-c31ca2660855", "metadata": { "canvas": { "comments": [], "componentType": "CodeCell", "copiedOriginId": null, "diskcache": false, "headerColor": "inherit", "id": "a16d8c78-8820-4f89-87c5-dfbdd31e7189", "isComponent": false, "name": "", "parents": [] } }, "source": ["### 1. Load packages and data"] }, { "cell_type": "code", "execution_count": null, "id": "4d992b20-ccb3-461a-a179-837be66ed332", "metadata": { "canvas": { "comments": [], "componentType": "CodeCell", "copiedOriginId": null, "diskcache": false, "headerColor": "#FAFF00", "id": "3775bea6-ddd5-4b03-a71f-fefa8e117d17", "isComponent": true, "name": "Import packages", "parents": [] }, "tags": [] }, "outputs": [], "source": [ "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import pandas as pd\n", "import seaborn as sns\n", "from sklearn.datasets import load_iris\n", "from sklearn.ensemble import RandomForestClassifier, VotingClassifier\n", "from sklearn.linear_model import LogisticRegression\n", "from sklearn.metrics import accuracy_score\n", "from sklearn.model_selection import train_test_split\n", "from sklearn.neighbors import KNeighborsClassifier" ] }, { "cell_type": "code", "execution_count": null, "id": "d70ec00b-7f5a-4966-9745-4c701c277bb5", "metadata": { "canvas": { "comments": [], "componentType": "CodeCell", "copiedOriginId": null, "diskcache": false, "headerColor": "#FAFF00", "id": "efb0edc1-0372-4bfe-a92c-e481b84ba186", "isComponent": true, "name": "Load data", "parents": [ { "id": "3775bea6-ddd5-4b03-a71f-fefa8e117d17", "name": "Import packages" } ] }, "tags": [] }, "outputs": [], "source": ["iris = load_iris()"] }, { "cell_type": "code", "execution_count": null, "id": "4e1fa4fe-2e65-478b-9a6c-adc479d4840a", "metadata": { "canvas": { "comments": [], "componentType": 
"CodeCell", "copiedOriginId": null, "diskcache": false, "headerColor": "#FAFF00", "id": "d691b23d-85e0-4ff1-ab92-dacf4e4ed3bc", "isComponent": true, "name": "Create dataframe", "parents": [ { "id": "efb0edc1-0372-4bfe-a92c-e481b84ba186", "name": "Load data" } ] }, "tags": [] }, "outputs": [ { "data": { "text/html": [ "
\n", " | sepal length (cm) | \n", "sepal width (cm) | \n", "petal length (cm) | \n", "petal width (cm) | \n", "target | \n", "
---|---|---|---|---|---|
0 | \n", "5.1 | \n", "3.5 | \n", "1.4 | \n", "0.2 | \n", "0 | \n", "
1 | \n", "4.9 | \n", "3.0 | \n", "1.4 | \n", "0.2 | \n", "0 | \n", "
2 | \n", "4.7 | \n", "3.2 | \n", "1.3 | \n", "0.2 | \n", "0 | \n", "
3 | \n", "4.6 | \n", "3.1 | \n", "1.5 | \n", "0.2 | \n", "0 | \n", "
4 | \n", "5.0 | \n", "3.6 | \n", "1.4 | \n", "0.2 | \n", "0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
145 | \n", "6.7 | \n", "3.0 | \n", "5.2 | \n", "2.3 | \n", "2 | \n", "
146 | \n", "6.3 | \n", "2.5 | \n", "5.0 | \n", "1.9 | \n", "2 | \n", "
147 | \n", "6.5 | \n", "3.0 | \n", "5.2 | \n", "2.0 | \n", "2 | \n", "
148 | \n", "6.2 | \n", "3.4 | \n", "5.4 | \n", "2.3 | \n", "2 | \n", "
149 | \n", "5.9 | \n", "3.0 | \n", "5.1 | \n", "1.8 | \n", "2 | \n", "
150 rows × 5 columns
\n", "\n", " | sepal length (cm) | \n", "sepal width (cm) | \n", "petal length (cm) | \n", "petal width (cm) | \n", "target | \n", "
---|---|---|---|---|---|
0 | \n", "5.1 | \n", "3.5 | \n", "1.4 | \n", "0.2 | \n", "setosa | \n", "
1 | \n", "4.9 | \n", "3.0 | \n", "1.4 | \n", "0.2 | \n", "setosa | \n", "
2 | \n", "4.7 | \n", "3.2 | \n", "1.3 | \n", "0.2 | \n", "setosa | \n", "
3 | \n", "4.6 | \n", "3.1 | \n", "1.5 | \n", "0.2 | \n", "setosa | \n", "
4 | \n", "5.0 | \n", "3.6 | \n", "1.4 | \n", "0.2 | \n", "setosa | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
145 | \n", "6.7 | \n", "3.0 | \n", "5.2 | \n", "2.3 | \n", "virginica | \n", "
146 | \n", "6.3 | \n", "2.5 | \n", "5.0 | \n", "1.9 | \n", "virginica | \n", "
147 | \n", "6.5 | \n", "3.0 | \n", "5.2 | \n", "2.0 | \n", "virginica | \n", "
148 | \n", "6.2 | \n", "3.4 | \n", "5.4 | \n", "2.3 | \n", "virginica | \n", "
149 | \n", "5.9 | \n", "3.0 | \n", "5.1 | \n", "1.8 | \n", "virginica | \n", "
150 rows × 5 columns
\n", "