{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# PyCaret 2 Regression Example\n", "This notebook was created using PyCaret 2.0. Last updated: 31-07-2020" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "2.0\n" ] } ], "source": [ "# check version\n", "from pycaret.utils import version\n", "version()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 1. Loading Dataset" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | age | \n", "sex | \n", "bmi | \n", "children | \n", "smoker | \n", "region | \n", "charges | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "19 | \n", "female | \n", "27.900 | \n", "0 | \n", "yes | \n", "southwest | \n", "16884.92400 | \n", "
1 | \n", "18 | \n", "male | \n", "33.770 | \n", "1 | \n", "no | \n", "southeast | \n", "1725.55230 | \n", "
2 | \n", "28 | \n", "male | \n", "33.000 | \n", "3 | \n", "no | \n", "southeast | \n", "4449.46200 | \n", "
3 | \n", "33 | \n", "male | \n", "22.705 | \n", "0 | \n", "no | \n", "northwest | \n", "21984.47061 | \n", "
4 | \n", "32 | \n", "male | \n", "28.880 | \n", "0 | \n", "no | \n", "northwest | \n", "3866.85520 | \n", "
Description | Value | |
---|---|---|
0 | \n", "session_id | \n", "123 | \n", "
1 | \n", "Transform Target | \n", "False | \n", "
2 | \n", "Transform Target Method | \n", "None | \n", "
3 | \n", "Original Data | \n", "(1338, 7) | \n", "
4 | \n", "Missing Values | \n", "False | \n", "
5 | \n", "Numeric Features | \n", "2 | \n", "
6 | \n", "Categorical Features | \n", "4 | \n", "
7 | \n", "Ordinal Features | \n", "False | \n", "
8 | \n", "High Cardinality Features | \n", "False | \n", "
9 | \n", "High Cardinality Method | \n", "None | \n", "
10 | \n", "Sampled Data | \n", "(1338, 7) | \n", "
11 | \n", "Transformed Train Set | \n", "(936, 16) | \n", "
12 | \n", "Transformed Test Set | \n", "(402, 16) | \n", "
13 | \n", "Numeric Imputer | \n", "mean | \n", "
14 | \n", "Categorical Imputer | \n", "constant | \n", "
15 | \n", "Normalize | \n", "False | \n", "
16 | \n", "Normalize Method | \n", "None | \n", "
17 | \n", "Transformation | \n", "False | \n", "
18 | \n", "Transformation Method | \n", "None | \n", "
19 | \n", "PCA | \n", "False | \n", "
20 | \n", "PCA Method | \n", "None | \n", "
21 | \n", "PCA Components | \n", "None | \n", "
22 | \n", "Ignore Low Variance | \n", "False | \n", "
23 | \n", "Combine Rare Levels | \n", "False | \n", "
24 | \n", "Rare Level Threshold | \n", "None | \n", "
25 | \n", "Numeric Binning | \n", "False | \n", "
26 | \n", "Remove Outliers | \n", "False | \n", "
27 | \n", "Outliers Threshold | \n", "None | \n", "
28 | \n", "Remove Multicollinearity | \n", "False | \n", "
29 | \n", "Multicollinearity Threshold | \n", "None | \n", "
30 | \n", "Clustering | \n", "False | \n", "
31 | \n", "Clustering Iteration | \n", "None | \n", "
32 | \n", "Polynomial Features | \n", "False | \n", "
33 | \n", "Polynomial Degree | \n", "None | \n", "
34 | \n", "Trignometry Features | \n", "False | \n", "
35 | \n", "Polynomial Threshold | \n", "None | \n", "
36 | \n", "Group Features | \n", "False | \n", "
37 | \n", "Feature Selection | \n", "False | \n", "
38 | \n", "Features Selection Threshold | \n", "None | \n", "
39 | \n", "Feature Interaction | \n", "False | \n", "
40 | \n", "Feature Ratio | \n", "False | \n", "
41 | \n", "Interaction Threshold | \n", "None | \n", "
Model | MAE | MSE | RMSE | R2 | RMSLE | MAPE | TT (Sec) | |
---|---|---|---|---|---|---|---|---|
0 | \n", "Extreme Gradient Boosting | \n", "2666.8675 | \n", "22721899.5305 | \n", "4764.4228 | \n", "0.8410 | \n", "0.4428 | \n", "0.3151 | \n", "0.0429 | \n", "
1 | \n", "Gradient Boosting Regressor | \n", "2671.5927 | \n", "23019681.2661 | \n", "4794.6037 | \n", "0.8393 | \n", "0.4439 | \n", "0.3143 | \n", "0.0683 | \n", "
2 | \n", "CatBoost Regressor | \n", "2814.6048 | \n", "24757340.4659 | \n", "4973.7765 | \n", "0.8265 | \n", "0.4734 | \n", "0.3427 | \n", "1.1286 | \n", "
3 | \n", "Random Forest | \n", "2779.2026 | \n", "25351757.1506 | \n", "5032.2587 | \n", "0.8218 | \n", "0.4816 | \n", "0.3432 | \n", "0.2087 | \n", "
4 | \n", "Light Gradient Boosting Machine | \n", "3018.9895 | \n", "25515012.3051 | \n", "5049.8492 | \n", "0.8192 | \n", "0.5534 | \n", "0.3876 | \n", "0.0815 | \n", "
5 | \n", "Extra Trees Regressor | \n", "2755.9265 | \n", "28180447.2658 | \n", "5299.6566 | \n", "0.8043 | \n", "0.4875 | \n", "0.3255 | \n", "0.1496 | \n", "
6 | \n", "AdaBoost Regressor | \n", "4366.1001 | \n", "29298215.0087 | \n", "5411.0606 | \n", "0.7915 | \n", "0.6478 | \n", "0.7662 | \n", "0.0195 | \n", "
7 | \n", "Ridge Regression | \n", "4339.6093 | \n", "38542499.6202 | \n", "6196.4891 | \n", "0.7343 | \n", "0.6348 | \n", "0.4429 | \n", "0.0036 | \n", "
8 | \n", "Bayesian Ridge | \n", "4343.5006 | \n", "38542310.2536 | \n", "6196.4607 | \n", "0.7343 | \n", "0.6405 | \n", "0.4436 | \n", "0.0058 | \n", "
9 | \n", "Linear Regression | \n", "4332.7658 | \n", "38549952.0026 | \n", "6197.0842 | \n", "0.7343 | \n", "0.6369 | \n", "0.4415 | \n", "0.0043 | \n", "
10 | \n", "Lasso Regression | \n", "4332.6327 | \n", "38543897.4692 | \n", "6196.6074 | \n", "0.7343 | \n", "0.6404 | \n", "0.4416 | \n", "0.0038 | \n", "
11 | \n", "TheilSen Regressor | \n", "4124.3658 | \n", "38946435.2631 | \n", "6224.8917 | \n", "0.7327 | \n", "0.5337 | \n", "0.3743 | \n", "0.7617 | \n", "
12 | \n", "Least Angle Regression | \n", "4323.4578 | \n", "40017870.2286 | \n", "6312.0115 | \n", "0.7250 | \n", "0.5647 | \n", "0.4242 | \n", "0.0062 | \n", "
13 | \n", "Lasso Least Angle Regression | \n", "4322.4466 | \n", "40023599.4550 | \n", "6312.5498 | \n", "0.7249 | \n", "0.5401 | \n", "0.4245 | \n", "0.0060 | \n", "
14 | \n", "Decision Tree | \n", "3184.9728 | \n", "44561182.4569 | \n", "6663.2248 | \n", "0.6826 | \n", "0.5343 | \n", "0.3523 | \n", "0.0050 | \n", "
15 | \n", "Huber Regressor | \n", "3478.8635 | \n", "49170605.5859 | \n", "6997.8228 | \n", "0.6590 | \n", "0.4873 | \n", "0.2212 | \n", "0.0472 | \n", "
16 | \n", "Random Sample Consensus | \n", "3467.4036 | \n", "52056856.3074 | \n", "7203.0774 | \n", "0.6382 | \n", "0.4970 | \n", "0.2175 | \n", "0.0831 | \n", "
17 | \n", "Orthogonal Matching Pursuit | \n", "5760.0475 | \n", "57656797.2076 | \n", "7580.0224 | \n", "0.6026 | \n", "0.7426 | \n", "0.8996 | \n", "0.0034 | \n", "
18 | \n", "Passive Aggressive Regressor | \n", "4817.2726 | \n", "59211213.8323 | \n", "7652.9707 | \n", "0.5928 | \n", "0.7577 | \n", "0.4334 | \n", "0.0068 | \n", "
19 | \n", "Elastic Net | \n", "6399.4702 | \n", "72811792.6577 | \n", "8506.2813 | \n", "0.5021 | \n", "0.6789 | \n", "0.8016 | \n", "0.0030 | \n", "
20 | \n", "K Neighbors Regressor | \n", "6858.1227 | \n", "105272520.3363 | \n", "10228.2497 | \n", "0.2784 | \n", "0.7524 | \n", "0.7450 | \n", "0.0036 | \n", "
21 | \n", "Support Vector Machine | \n", "8401.1273 | \n", "163965107.0052 | \n", "12732.6249 | \n", "-0.1092 | \n", "0.9303 | \n", "1.0323 | \n", "0.0308 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "2972.9329 | \n", "24058897.4348 | \n", "4904.9870 | \n", "0.8563 | \n", "0.6083 | \n", "0.3985 | \n", "
1 | \n", "3080.5340 | \n", "29299758.4480 | \n", "5412.9251 | \n", "0.8296 | \n", "0.4459 | \n", "0.3268 | \n", "
2 | \n", "3022.2314 | \n", "27624562.6635 | \n", "5255.9074 | \n", "0.6502 | \n", "0.6822 | \n", "0.4361 | \n", "
3 | \n", "3146.2422 | \n", "25018958.4876 | \n", "5001.8955 | \n", "0.7911 | \n", "0.6398 | \n", "0.5095 | \n", "
4 | \n", "3154.6899 | \n", "28894513.0880 | \n", "5375.3617 | \n", "0.7851 | \n", "0.5901 | \n", "0.3617 | \n", "
5 | \n", "2931.0896 | \n", "21432486.1979 | \n", "4629.5233 | \n", "0.8621 | \n", "0.4131 | \n", "0.2829 | \n", "
6 | \n", "2625.9358 | \n", "20785814.4415 | \n", "4559.1462 | \n", "0.8586 | \n", "0.3891 | \n", "0.3070 | \n", "
7 | \n", "2678.3617 | \n", "24232738.5540 | \n", "4922.6760 | \n", "0.8668 | \n", "0.5098 | \n", "0.2720 | \n", "
8 | \n", "2710.3380 | \n", "21418665.4818 | \n", "4628.0304 | \n", "0.8617 | \n", "0.5574 | \n", "0.4101 | \n", "
9 | \n", "3273.2286 | \n", "29598375.8594 | \n", "5440.4389 | \n", "0.8094 | \n", "0.5916 | \n", "0.3804 | \n", "
Mean | \n", "2959.5584 | \n", "25236477.0656 | \n", "5013.0892 | \n", "0.8171 | \n", "0.5427 | \n", "0.3685 | \n", "
SD | \n", "210.5599 | \n", "3254481.9214 | \n", "324.6755 | \n", "0.0628 | \n", "0.0943 | \n", "0.0703 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "4202.0830 | \n", "37315426.0049 | \n", "6108.6354 | \n", "0.7771 | \n", "0.6969 | \n", "0.5901 | \n", "
1 | \n", "4164.7622 | \n", "38772693.8976 | \n", "6226.7723 | \n", "0.7746 | \n", "0.6826 | \n", "0.4917 | \n", "
2 | \n", "4545.7489 | \n", "45041923.5654 | \n", "6711.3280 | \n", "0.4297 | \n", "0.9558 | \n", "0.6772 | \n", "
3 | \n", "4390.3370 | \n", "41942311.1362 | \n", "6476.2884 | \n", "0.6498 | \n", "0.7140 | \n", "0.7225 | \n", "
4 | \n", "4617.2417 | \n", "41981223.1575 | \n", "6479.2919 | \n", "0.6878 | \n", "0.6963 | \n", "0.5784 | \n", "
5 | \n", "4166.0225 | \n", "34525507.1405 | \n", "5875.8410 | \n", "0.7779 | \n", "0.6199 | \n", "0.4641 | \n", "
6 | \n", "3916.8456 | \n", "31704830.1337 | \n", "5630.7042 | \n", "0.7843 | \n", "0.7189 | \n", "0.4801 | \n", "
7 | \n", "3689.6088 | \n", "32718649.0173 | \n", "5720.0218 | \n", "0.8201 | \n", "0.6266 | \n", "0.4303 | \n", "
8 | \n", "3995.6685 | \n", "35808315.2188 | \n", "5984.0049 | \n", "0.7687 | \n", "0.9064 | \n", "0.6267 | \n", "
9 | \n", "4616.1772 | \n", "47556279.2763 | \n", "6896.1061 | \n", "0.6937 | \n", "0.8657 | \n", "0.7124 | \n", "
Mean | \n", "4230.4495 | \n", "38736715.8548 | \n", "6210.8994 | \n", "0.7164 | \n", "0.7483 | \n", "0.5773 | \n", "
SD | \n", "296.4153 | \n", "5023332.8140 | \n", "401.8016 | \n", "0.1081 | \n", "0.1117 | \n", "0.1015 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "2593.5203 | \n", "18901959.3512 | \n", "4347.6384 | \n", "0.8871 | \n", "0.4122 | \n", "0.3237 | \n", "
1 | \n", "3035.8826 | \n", "30123714.3097 | \n", "5488.5075 | \n", "0.8249 | \n", "0.4577 | \n", "0.3318 | \n", "
2 | \n", "2783.8710 | \n", "21407816.7463 | \n", "4626.8582 | \n", "0.7290 | \n", "0.4923 | \n", "0.4139 | \n", "
3 | \n", "2870.6945 | \n", "21243674.2878 | \n", "4609.0861 | \n", "0.8226 | \n", "0.4748 | \n", "0.4161 | \n", "
4 | \n", "2838.7473 | \n", "24370286.3864 | \n", "4936.6270 | \n", "0.8187 | \n", "0.4455 | \n", "0.3016 | \n", "
5 | \n", "2632.6379 | \n", "18784222.6047 | \n", "4334.0769 | \n", "0.8792 | \n", "0.3588 | \n", "0.2780 | \n", "
6 | \n", "2523.0774 | \n", "19451327.4176 | \n", "4410.3659 | \n", "0.8676 | \n", "0.3888 | \n", "0.3309 | \n", "
7 | \n", "2700.1459 | \n", "24627482.8087 | \n", "4962.6085 | \n", "0.8646 | \n", "0.4674 | \n", "0.3220 | \n", "
8 | \n", "2627.2142 | \n", "19952600.0244 | \n", "4466.8333 | \n", "0.8711 | \n", "0.4601 | \n", "0.3909 | \n", "
9 | \n", "2945.2125 | \n", "25414198.6301 | \n", "5041.2497 | \n", "0.8363 | \n", "0.4971 | \n", "0.3744 | \n", "
Mean | \n", "2755.1004 | \n", "22427728.2567 | \n", "4722.3851 | \n", "0.8401 | \n", "0.4455 | \n", "0.3483 | \n", "
SD | \n", "158.2664 | \n", "3462560.6654 | \n", "356.0994 | \n", "0.0441 | \n", "0.0429 | \n", "0.0452 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "3130.7528 | \n", "39833455.1804 | \n", "6311.3751 | \n", "0.7621 | \n", "0.5067 | \n", "0.3295 | \n", "
1 | \n", "3104.8369 | \n", "45066079.6663 | \n", "6713.1274 | \n", "0.7380 | \n", "0.5410 | \n", "0.3104 | \n", "
2 | \n", "3315.3420 | \n", "47502769.5127 | \n", "6892.2253 | \n", "0.3986 | \n", "0.6452 | \n", "0.4540 | \n", "
3 | \n", "2869.0078 | \n", "40057346.7729 | \n", "6329.0874 | \n", "0.6655 | \n", "0.6043 | \n", "0.5635 | \n", "
4 | \n", "4039.3881 | \n", "64499878.1756 | \n", "8031.1816 | \n", "0.5203 | \n", "0.6590 | \n", "0.5106 | \n", "
5 | \n", "3324.7419 | \n", "41203145.5554 | \n", "6418.9676 | \n", "0.7350 | \n", "0.4916 | \n", "0.3224 | \n", "
6 | \n", "2579.6933 | \n", "38790767.7084 | \n", "6228.2235 | \n", "0.7361 | \n", "0.3911 | \n", "0.2259 | \n", "
7 | \n", "2727.9530 | \n", "35755628.9950 | \n", "5979.6011 | \n", "0.8034 | \n", "0.4698 | \n", "0.1807 | \n", "
8 | \n", "2863.0106 | \n", "38662493.2325 | \n", "6217.9171 | \n", "0.7503 | \n", "0.5113 | \n", "0.4390 | \n", "
9 | \n", "3207.8434 | \n", "47265363.5462 | \n", "6874.9810 | \n", "0.6956 | \n", "0.5121 | \n", "0.2716 | \n", "
Mean | \n", "3116.2570 | \n", "43863692.8345 | \n", "6599.6687 | \n", "0.6805 | \n", "0.5332 | \n", "0.3608 | \n", "
SD | \n", "388.3229 | \n", "7800317.0820 | \n", "555.0368 | \n", "0.1190 | \n", "0.0781 | \n", "0.1191 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "2689.4264 | \n", "22734130.6123 | \n", "4768.0322 | \n", "0.8642 | \n", "0.4756 | \n", "0.3477 | \n", "
1 | \n", "2850.5489 | \n", "30834672.8607 | \n", "5552.8977 | \n", "0.8207 | \n", "0.4683 | \n", "0.2826 | \n", "
2 | \n", "2767.0499 | \n", "24433673.6238 | \n", "4943.0430 | \n", "0.6906 | \n", "0.5459 | \n", "0.3887 | \n", "
3 | \n", "2842.4438 | \n", "24548531.6439 | \n", "4954.6475 | \n", "0.7950 | \n", "0.5165 | \n", "0.4156 | \n", "
4 | \n", "3020.6002 | \n", "30696946.6676 | \n", "5540.4825 | \n", "0.7717 | \n", "0.5602 | \n", "0.3738 | \n", "
5 | \n", "2818.9442 | \n", "22660137.1436 | \n", "4760.2665 | \n", "0.8542 | \n", "0.3712 | \n", "0.2631 | \n", "
6 | \n", "2617.3220 | \n", "22836756.3973 | \n", "4778.7819 | \n", "0.8446 | \n", "0.3874 | \n", "0.3035 | \n", "
7 | \n", "2684.8101 | \n", "24880599.5740 | \n", "4988.0457 | \n", "0.8632 | \n", "0.4451 | \n", "0.2565 | \n", "
8 | \n", "2334.3161 | \n", "18535034.5531 | \n", "4305.2334 | \n", "0.8803 | \n", "0.4357 | \n", "0.3510 | \n", "
9 | \n", "2820.2249 | \n", "29299167.6551 | \n", "5412.8706 | \n", "0.8113 | \n", "0.5072 | \n", "0.3478 | \n", "
Mean | \n", "2744.5686 | \n", "25145965.0731 | \n", "5000.4301 | \n", "0.8196 | \n", "0.4713 | \n", "0.3330 | \n", "
SD | \n", "173.1694 | \n", "3773482.7721 | \n", "376.3829 | \n", "0.0538 | \n", "0.0599 | \n", "0.0515 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "2088.6098 | \n", "25306132.7724 | \n", "5030.5201 | \n", "0.8489 | \n", "0.4360 | \n", "0.2089 | \n", "
1 | \n", "2694.4500 | \n", "37713226.9165 | \n", "6141.1096 | \n", "0.7807 | \n", "0.5023 | \n", "0.2522 | \n", "
2 | \n", "2580.2904 | \n", "31829320.0726 | \n", "5641.7480 | \n", "0.5970 | \n", "0.5954 | \n", "0.3725 | \n", "
3 | \n", "2026.3867 | \n", "22848511.3127 | \n", "4780.0116 | \n", "0.8092 | \n", "0.3817 | \n", "0.1531 | \n", "
4 | \n", "2783.9969 | \n", "36022333.0588 | \n", "6001.8608 | \n", "0.7321 | \n", "0.5899 | \n", "0.3035 | \n", "
5 | \n", "3304.0820 | \n", "42910088.5364 | \n", "6550.5793 | \n", "0.7240 | \n", "0.4398 | \n", "0.2454 | \n", "
6 | \n", "1691.5091 | \n", "21151389.5978 | \n", "4599.0640 | \n", "0.8561 | \n", "0.3226 | \n", "0.1226 | \n", "
7 | \n", "1941.8231 | \n", "22752869.9142 | \n", "4769.9968 | \n", "0.8749 | \n", "0.3608 | \n", "0.1170 | \n", "
8 | \n", "1842.4044 | \n", "20941293.3847 | \n", "4576.1658 | \n", "0.8647 | \n", "0.3641 | \n", "0.2280 | \n", "
9 | \n", "2618.3033 | \n", "36220824.9672 | \n", "6018.3739 | \n", "0.7667 | \n", "0.4830 | \n", "0.2274 | \n", "
Mean | \n", "2357.1856 | \n", "29769599.0533 | \n", "5410.9430 | \n", "0.7854 | \n", "0.4476 | \n", "0.2231 | \n", "
SD | \n", "487.1035 | \n", "7681159.5886 | \n", "700.9244 | \n", "0.0815 | \n", "0.0900 | \n", "0.0753 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "3567.6029 | \n", "27065352.2604 | \n", "5202.4371 | \n", "0.8383 | \n", "0.4429 | \n", "0.3872 | \n", "
1 | \n", "3948.5443 | \n", "38042231.7924 | \n", "6167.8385 | \n", "0.7788 | \n", "0.4681 | \n", "0.3602 | \n", "
2 | \n", "3248.6907 | \n", "23594846.3548 | \n", "4857.4527 | \n", "0.7013 | \n", "0.5082 | \n", "0.4408 | \n", "
3 | \n", "3228.9006 | \n", "21265240.6874 | \n", "4611.4250 | \n", "0.8224 | \n", "0.4846 | \n", "0.4734 | \n", "
4 | \n", "3810.7794 | \n", "33931591.3072 | \n", "5825.0829 | \n", "0.7476 | \n", "0.4926 | \n", "0.3832 | \n", "
5 | \n", "3393.4626 | \n", "27950743.3064 | \n", "5286.8463 | \n", "0.8202 | \n", "0.3729 | \n", "0.3003 | \n", "
6 | \n", "3321.4944 | \n", "29360441.7289 | \n", "5418.5276 | \n", "0.8002 | \n", "0.4215 | \n", "0.3687 | \n", "
7 | \n", "3924.0898 | \n", "32840540.1406 | \n", "5730.6666 | \n", "0.8194 | \n", "0.4448 | \n", "0.3407 | \n", "
8 | \n", "3590.2695 | \n", "28114541.8115 | \n", "5302.3148 | \n", "0.8184 | \n", "0.4747 | \n", "0.4435 | \n", "
9 | \n", "3792.9335 | \n", "32627264.4348 | \n", "5712.0280 | \n", "0.7898 | \n", "0.5095 | \n", "0.3913 | \n", "
Mean | \n", "3582.6768 | \n", "29479279.3824 | \n", "5411.4620 | \n", "0.7937 | \n", "0.4620 | \n", "0.3889 | \n", "
SD | \n", "262.2343 | \n", "4759119.6736 | \n", "441.9942 | \n", "0.0397 | \n", "0.0403 | \n", "0.0493 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "2564.5809 | \n", "20266074.9345 | \n", "4501.7857 | \n", "0.8790 | \n", "0.4370 | \n", "0.3141 | \n", "
1 | \n", "2934.3770 | \n", "31081553.1267 | \n", "5575.0832 | \n", "0.8193 | \n", "0.4979 | \n", "0.2816 | \n", "
2 | \n", "2670.1672 | \n", "23415471.9712 | \n", "4838.9536 | \n", "0.7035 | \n", "0.5099 | \n", "0.3105 | \n", "
3 | \n", "2798.8665 | \n", "21176854.5981 | \n", "4601.8317 | \n", "0.8232 | \n", "0.4631 | \n", "0.3736 | \n", "
4 | \n", "2894.4125 | \n", "27549639.0133 | \n", "5248.7750 | \n", "0.7951 | \n", "0.5208 | \n", "0.3140 | \n", "
5 | \n", "2684.3001 | \n", "20037070.5693 | \n", "4476.2787 | \n", "0.8711 | \n", "0.4571 | \n", "0.2697 | \n", "
6 | \n", "2458.3706 | \n", "19953697.9106 | \n", "4466.9562 | \n", "0.8642 | \n", "0.3486 | \n", "0.2697 | \n", "
7 | \n", "2744.8664 | \n", "25598490.3265 | \n", "5059.4951 | \n", "0.8592 | \n", "0.4347 | \n", "0.2507 | \n", "
8 | \n", "2341.0738 | \n", "17775685.5344 | \n", "4216.1221 | \n", "0.8852 | \n", "0.3964 | \n", "0.3114 | \n", "
9 | \n", "2994.9821 | \n", "27582079.6067 | \n", "5251.8644 | \n", "0.8223 | \n", "0.5355 | \n", "0.3599 | \n", "
Mean | \n", "2708.5997 | \n", "23443661.7591 | \n", "4823.7146 | \n", "0.8322 | \n", "0.4601 | \n", "0.3055 | \n", "
SD | \n", "199.3687 | \n", "4100160.4270 | \n", "418.8550 | \n", "0.0515 | \n", "0.0557 | \n", "0.0373 | \n", "
\n", " | Model | \n", "MAE | \n", "MSE | \n", "RMSE | \n", "R2 | \n", "RMSLE | \n", "MAPE | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "Light Gradient Boosting Machine | \n", "2764.0353 | \n", "2.068683e+07 | \n", "4548.2773 | \n", "0.8552 | \n", "0.5223 | \n", "0.3678 | \n", "
\n", " | age | \n", "bmi | \n", "sex_female | \n", "sex_male | \n", "children_0 | \n", "children_1 | \n", "children_2 | \n", "children_3 | \n", "children_4 | \n", "children_5 | \n", "smoker_no | \n", "smoker_yes | \n", "region_northeast | \n", "region_northwest | \n", "region_southeast | \n", "region_southwest | \n", "charges | \n", "Label | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "49.0 | \n", "42.680 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "9800.88820 | \n", "9363.9665 | \n", "
1 | \n", "32.0 | \n", "37.335 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "4667.60765 | \n", "10393.4936 | \n", "
2 | \n", "27.0 | \n", "31.400 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "34838.87300 | \n", "35628.9933 | \n", "
3 | \n", "35.0 | \n", "24.130 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "5125.21570 | \n", "6926.8267 | \n", "
4 | \n", "60.0 | \n", "25.740 | \n", "0.0 | \n", "1.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "12142.57860 | \n", "17508.2783 | \n", "
\n", " | age | \n", "sex | \n", "bmi | \n", "children | \n", "smoker | \n", "region | \n", "Label | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "19 | \n", "female | \n", "27.900 | \n", "0 | \n", "yes | \n", "southwest | \n", "16884.9240 | \n", "
1 | \n", "18 | \n", "male | \n", "33.770 | \n", "1 | \n", "no | \n", "southeast | \n", "1725.5523 | \n", "
2 | \n", "28 | \n", "male | \n", "33.000 | \n", "3 | \n", "no | \n", "southeast | \n", "5138.2567 | \n", "
3 | \n", "33 | \n", "male | \n", "22.705 | \n", "0 | \n", "no | \n", "northwest | \n", "21984.4706 | \n", "
4 | \n", "32 | \n", "male | \n", "28.880 | \n", "0 | \n", "no | \n", "northwest | \n", "3866.8552 | \n", "
Pipeline(memory=None,\n", " steps=[('dtypes',\n", " DataTypes_Auto_infer(categorical_features=[],\n", " display_types=True, features_todrop=[],\n", " ml_usecase='regression',\n", " numerical_features=[], target='charges',\n", " time_features=[])),\n", " ('imputer',\n", " Simple_Imputer(categorical_strategy='not_available',\n", " numeric_strategy='mean',\n", " target_variable=None)),\n", " ('new_levels1',\n", " New_Catagorical_Levels...\n", " ('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\n", " ('P_transform', Empty()), ('pt_target', Empty()),\n", " ('binn', Empty()), ('rem_outliers', Empty()),\n", " ('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\n", " ('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\n", " ('feature_select', Empty()), ('fix_multi', Empty()),\n", " ('dfs', Empty()), ('pca', Empty())],\n", " verbose=False)
DataTypes_Auto_infer(ml_usecase='regression', target='charges')
Simple_Imputer(categorical_strategy='not_available', numeric_strategy='mean',\n", " target_variable=None)
New_Catagorical_Levels_in_TestData(replacement_strategy='least frequent',\n", " target='charges')
Empty()
Empty()
Empty()
Empty()
New_Catagorical_Levels_in_TestData(replacement_strategy='least frequent',\n", " target='charges')
Make_Time_Features(list_of_features=None)
Empty()
Empty()
Empty()
Empty()
Empty()
Empty()
Empty()
Empty()
Dummify(target='charges')
Empty()
Clean_Colum_Names()
Empty()
Empty()
Empty()
Empty()
\n", " | age | \n", "bmi | \n", "sex_female | \n", "sex_male | \n", "children_0 | \n", "children_1 | \n", "children_2 | \n", "children_3 | \n", "children_4 | \n", "children_5 | \n", "smoker_no | \n", "smoker_yes | \n", "region_northeast | \n", "region_northwest | \n", "region_southeast | \n", "region_southwest | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
300 | \n", "36.0 | \n", "27.55 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "
904 | \n", "60.0 | \n", "35.10 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "
670 | \n", "30.0 | \n", "31.57 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
617 | \n", "49.0 | \n", "25.60 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "
373 | \n", "26.0 | \n", "32.90 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "