{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# PyCaret 2 Regression Example\n", "This notebook is created using PyCaret 2.0. Last updated : 28-07-2020" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "pycaret-nightly-0.39\n" ] } ], "source": [ "# check version\n", "from pycaret.utils import version\n", "version()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 1. Loading Dataset" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | age | \n", "sex | \n", "bmi | \n", "children | \n", "smoker | \n", "region | \n", "charges | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "19 | \n", "female | \n", "27.900 | \n", "0 | \n", "yes | \n", "southwest | \n", "16884.92400 | \n", "
1 | \n", "18 | \n", "male | \n", "33.770 | \n", "1 | \n", "no | \n", "southeast | \n", "1725.55230 | \n", "
2 | \n", "28 | \n", "male | \n", "33.000 | \n", "3 | \n", "no | \n", "southeast | \n", "4449.46200 | \n", "
3 | \n", "33 | \n", "male | \n", "22.705 | \n", "0 | \n", "no | \n", "northwest | \n", "21984.47061 | \n", "
4 | \n", "32 | \n", "male | \n", "28.880 | \n", "0 | \n", "no | \n", "northwest | \n", "3866.85520 | \n", "
Description | Value | |
---|---|---|
0 | \n", "session_id | \n", "123 | \n", "
1 | \n", "Transform Target | \n", "False | \n", "
2 | \n", "Transform Target Method | \n", "None | \n", "
3 | \n", "Original Data | \n", "(1338, 7) | \n", "
4 | \n", "Missing Values | \n", "False | \n", "
5 | \n", "Numeric Features | \n", "2 | \n", "
6 | \n", "Categorical Features | \n", "4 | \n", "
7 | \n", "Ordinal Features | \n", "False | \n", "
8 | \n", "High Cardinality Features | \n", "False | \n", "
9 | \n", "High Cardinality Method | \n", "None | \n", "
10 | \n", "Sampled Data | \n", "(1338, 7) | \n", "
11 | \n", "Transformed Train Set | \n", "(936, 16) | \n", "
12 | \n", "Transformed Test Set | \n", "(402, 16) | \n", "
13 | \n", "Numeric Imputer | \n", "mean | \n", "
14 | \n", "Categorical Imputer | \n", "constant | \n", "
15 | \n", "Normalize | \n", "False | \n", "
16 | \n", "Normalize Method | \n", "None | \n", "
17 | \n", "Transformation | \n", "False | \n", "
18 | \n", "Transformation Method | \n", "None | \n", "
19 | \n", "PCA | \n", "False | \n", "
20 | \n", "PCA Method | \n", "None | \n", "
21 | \n", "PCA Components | \n", "None | \n", "
22 | \n", "Ignore Low Variance | \n", "False | \n", "
23 | \n", "Combine Rare Levels | \n", "False | \n", "
24 | \n", "Rare Level Threshold | \n", "None | \n", "
25 | \n", "Numeric Binning | \n", "False | \n", "
26 | \n", "Remove Outliers | \n", "False | \n", "
27 | \n", "Outliers Threshold | \n", "None | \n", "
28 | \n", "Remove Multicollinearity | \n", "False | \n", "
29 | \n", "Multicollinearity Threshold | \n", "None | \n", "
30 | \n", "Clustering | \n", "False | \n", "
31 | \n", "Clustering Iteration | \n", "None | \n", "
32 | \n", "Polynomial Features | \n", "False | \n", "
33 | \n", "Polynomial Degree | \n", "None | \n", "
34 | \n", "Trignometry Features | \n", "False | \n", "
35 | \n", "Polynomial Threshold | \n", "None | \n", "
36 | \n", "Group Features | \n", "False | \n", "
37 | \n", "Feature Selection | \n", "False | \n", "
38 | \n", "Features Selection Threshold | \n", "None | \n", "
39 | \n", "Feature Interaction | \n", "False | \n", "
40 | \n", "Feature Ratio | \n", "False | \n", "
41 | \n", "Interaction Threshold | \n", "None | \n", "
Model | MAE | MSE | RMSE | R2 | RMSLE | MAPE | TT (Sec) | |
---|---|---|---|---|---|---|---|---|
0 | \n", "Gradient Boosting Regressor | \n", "2671.5927 | \n", "23019681.2661 | \n", "4794.6037 | \n", "0.8393 | \n", "0.4439 | \n", "0.3143 | \n", "0.1536 | \n", "
1 | \n", "CatBoost Regressor | \n", "2852.1323 | \n", "25408736.9696 | \n", "5038.5479 | \n", "0.8223 | \n", "0.4896 | \n", "0.3573 | \n", "3.9290 | \n", "
2 | \n", "Random Forest | \n", "2779.2026 | \n", "25351757.1506 | \n", "5032.2587 | \n", "0.8218 | \n", "0.4816 | \n", "0.3432 | \n", "0.5842 | \n", "
3 | \n", "Light Gradient Boosting Machine | \n", "3018.9895 | \n", "25515012.3051 | \n", "5049.8492 | \n", "0.8192 | \n", "0.5534 | \n", "0.3876 | \n", "0.2787 | \n", "
4 | \n", "Extra Trees Regressor | \n", "2755.9265 | \n", "28180447.2658 | \n", "5299.6566 | \n", "0.8043 | \n", "0.4875 | \n", "0.3255 | \n", "0.3242 | \n", "
5 | \n", "AdaBoost Regressor | \n", "4366.1001 | \n", "29298215.0087 | \n", "5411.0606 | \n", "0.7915 | \n", "0.6478 | \n", "0.7662 | \n", "0.0449 | \n", "
6 | \n", "Extreme Gradient Boosting | \n", "3257.2767 | \n", "31489403.0961 | \n", "5610.5079 | \n", "0.7774 | \n", "0.5723 | \n", "0.4072 | \n", "0.1843 | \n", "
7 | \n", "Bayesian Ridge | \n", "4343.5006 | \n", "38542310.2536 | \n", "6196.4607 | \n", "0.7343 | \n", "0.6405 | \n", "0.4436 | \n", "0.0195 | \n", "
8 | \n", "Linear Regression | \n", "4332.7658 | \n", "38549952.0026 | \n", "6197.0842 | \n", "0.7343 | \n", "0.6369 | \n", "0.4415 | \n", "0.0119 | \n", "
9 | \n", "Lasso Regression | \n", "4332.6327 | \n", "38543897.4692 | \n", "6196.6074 | \n", "0.7343 | \n", "0.6404 | \n", "0.4416 | \n", "0.0109 | \n", "
10 | \n", "Ridge Regression | \n", "4339.6093 | \n", "38542499.6202 | \n", "6196.4891 | \n", "0.7343 | \n", "0.6348 | \n", "0.4429 | \n", "0.0088 | \n", "
11 | \n", "TheilSen Regressor | \n", "4124.3658 | \n", "38946435.2631 | \n", "6224.8917 | \n", "0.7327 | \n", "0.5337 | \n", "0.3743 | \n", "3.0722 | \n", "
12 | \n", "Least Angle Regression | \n", "4323.4578 | \n", "40017870.2286 | \n", "6312.0115 | \n", "0.7250 | \n", "0.5647 | \n", "0.4242 | \n", "0.0223 | \n", "
13 | \n", "Lasso Least Angle Regression | \n", "4322.4466 | \n", "40023599.4550 | \n", "6312.5498 | \n", "0.7249 | \n", "0.5401 | \n", "0.4245 | \n", "0.0125 | \n", "
14 | \n", "Decision Tree | \n", "3184.9728 | \n", "44561182.4569 | \n", "6663.2248 | \n", "0.6826 | \n", "0.5343 | \n", "0.3523 | \n", "0.0142 | \n", "
15 | \n", "Huber Regressor | \n", "3478.8635 | \n", "49170605.5859 | \n", "6997.8228 | \n", "0.6590 | \n", "0.4873 | \n", "0.2212 | \n", "0.1435 | \n", "
16 | \n", "Random Sample Consensus | \n", "3467.4036 | \n", "52056856.3074 | \n", "7203.0774 | \n", "0.6382 | \n", "0.4970 | \n", "0.2175 | \n", "0.2620 | \n", "
17 | \n", "Orthogonal Matching Pursuit | \n", "5760.0475 | \n", "57656797.2076 | \n", "7580.0224 | \n", "0.6026 | \n", "0.7426 | \n", "0.8996 | \n", "0.0121 | \n", "
18 | \n", "Passive Aggressive Regressor | \n", "4817.2726 | \n", "59211213.8323 | \n", "7652.9707 | \n", "0.5928 | \n", "0.7577 | \n", "0.4334 | \n", "0.0262 | \n", "
19 | \n", "Elastic Net | \n", "6399.4702 | \n", "72811792.6577 | \n", "8506.2813 | \n", "0.5021 | \n", "0.6789 | \n", "0.8016 | \n", "0.0125 | \n", "
20 | \n", "K Neighbors Regressor | \n", "6858.1227 | \n", "105272520.3363 | \n", "10228.2497 | \n", "0.2784 | \n", "0.7524 | \n", "0.7450 | \n", "0.0115 | \n", "
21 | \n", "Support Vector Machine | \n", "8401.1273 | \n", "163965107.0052 | \n", "12732.6249 | \n", "-0.1092 | \n", "0.9303 | \n", "1.0323 | \n", "0.1238 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "2972.9329 | \n", "24058897.4348 | \n", "4904.9870 | \n", "0.8563 | \n", "0.6083 | \n", "0.3985 | \n", "
1 | \n", "3080.5340 | \n", "29299758.4480 | \n", "5412.9251 | \n", "0.8296 | \n", "0.4459 | \n", "0.3268 | \n", "
2 | \n", "3022.2314 | \n", "27624562.6635 | \n", "5255.9074 | \n", "0.6502 | \n", "0.6822 | \n", "0.4361 | \n", "
3 | \n", "3146.2422 | \n", "25018958.4876 | \n", "5001.8955 | \n", "0.7911 | \n", "0.6398 | \n", "0.5095 | \n", "
4 | \n", "3154.6899 | \n", "28894513.0880 | \n", "5375.3617 | \n", "0.7851 | \n", "0.5901 | \n", "0.3617 | \n", "
5 | \n", "2931.0896 | \n", "21432486.1979 | \n", "4629.5233 | \n", "0.8621 | \n", "0.4131 | \n", "0.2829 | \n", "
6 | \n", "2625.9358 | \n", "20785814.4415 | \n", "4559.1462 | \n", "0.8586 | \n", "0.3891 | \n", "0.3070 | \n", "
7 | \n", "2678.3617 | \n", "24232738.5540 | \n", "4922.6760 | \n", "0.8668 | \n", "0.5098 | \n", "0.2720 | \n", "
8 | \n", "2710.3380 | \n", "21418665.4818 | \n", "4628.0304 | \n", "0.8617 | \n", "0.5574 | \n", "0.4101 | \n", "
9 | \n", "3273.2286 | \n", "29598375.8594 | \n", "5440.4389 | \n", "0.8094 | \n", "0.5916 | \n", "0.3804 | \n", "
Mean | \n", "2959.5584 | \n", "25236477.0656 | \n", "5013.0892 | \n", "0.8171 | \n", "0.5427 | \n", "0.3685 | \n", "
SD | \n", "210.5599 | \n", "3254481.9214 | \n", "324.6755 | \n", "0.0628 | \n", "0.0943 | \n", "0.0703 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "4350.2786 | \n", "34500546.2577 | \n", "5873.7166 | \n", "0.7939 | \n", "0.5089 | \n", "0.4944 | \n", "
1 | \n", "4641.9050 | \n", "44009503.4790 | \n", "6633.9659 | \n", "0.7441 | \n", "0.5455 | \n", "0.4477 | \n", "
2 | \n", "3648.9829 | \n", "28251768.5639 | \n", "5315.2393 | \n", "0.6423 | \n", "0.5941 | \n", "0.5031 | \n", "
3 | \n", "3827.3364 | \n", "25940481.7351 | \n", "5093.1799 | \n", "0.7834 | \n", "0.7211 | \n", "0.5688 | \n", "
4 | \n", "4542.8494 | \n", "41552858.3168 | \n", "6446.1507 | \n", "0.6910 | \n", "0.5138 | \n", "0.4358 | \n", "
5 | \n", "4076.8334 | \n", "34419468.1707 | \n", "5866.8107 | \n", "0.7786 | \n", "0.6157 | \n", "0.3785 | \n", "
6 | \n", "4157.8144 | \n", "39058630.3277 | \n", "6249.6904 | \n", "0.7342 | \n", "0.4905 | \n", "0.4696 | \n", "
7 | \n", "4943.2337 | \n", "45628624.2843 | \n", "6754.8963 | \n", "0.7491 | \n", "0.5550 | \n", "0.4572 | \n", "
8 | \n", "4509.6618 | \n", "39513623.1379 | \n", "6285.9863 | \n", "0.7448 | \n", "0.5580 | \n", "0.5444 | \n", "
9 | \n", "4829.8905 | \n", "45317556.3344 | \n", "6731.8316 | \n", "0.7081 | \n", "0.7059 | \n", "0.5245 | \n", "
Mean | \n", "4352.8786 | \n", "37819306.0608 | \n", "6125.1468 | \n", "0.7370 | \n", "0.5808 | \n", "0.4824 | \n", "
SD | \n", "400.7726 | \n", "6550504.6006 | \n", "549.4390 | \n", "0.0439 | \n", "0.0755 | \n", "0.0535 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "2593.5203 | \n", "18901959.3512 | \n", "4347.6384 | \n", "0.8871 | \n", "0.4122 | \n", "0.3237 | \n", "
1 | \n", "3035.8826 | \n", "30123714.3097 | \n", "5488.5075 | \n", "0.8249 | \n", "0.4577 | \n", "0.3318 | \n", "
2 | \n", "2783.8710 | \n", "21407816.7463 | \n", "4626.8582 | \n", "0.7290 | \n", "0.4923 | \n", "0.4139 | \n", "
3 | \n", "2870.6945 | \n", "21243674.2878 | \n", "4609.0861 | \n", "0.8226 | \n", "0.4748 | \n", "0.4161 | \n", "
4 | \n", "2838.7473 | \n", "24370286.3864 | \n", "4936.6270 | \n", "0.8187 | \n", "0.4455 | \n", "0.3016 | \n", "
5 | \n", "2632.6379 | \n", "18784222.6047 | \n", "4334.0769 | \n", "0.8792 | \n", "0.3588 | \n", "0.2780 | \n", "
6 | \n", "2523.0774 | \n", "19451327.4176 | \n", "4410.3659 | \n", "0.8676 | \n", "0.3888 | \n", "0.3309 | \n", "
7 | \n", "2700.1459 | \n", "24627482.8087 | \n", "4962.6085 | \n", "0.8646 | \n", "0.4674 | \n", "0.3220 | \n", "
8 | \n", "2627.2142 | \n", "19952600.0244 | \n", "4466.8333 | \n", "0.8711 | \n", "0.4601 | \n", "0.3909 | \n", "
9 | \n", "2945.2125 | \n", "25414198.6301 | \n", "5041.2497 | \n", "0.8363 | \n", "0.4971 | \n", "0.3744 | \n", "
Mean | \n", "2755.1004 | \n", "22427728.2567 | \n", "4722.3851 | \n", "0.8401 | \n", "0.4455 | \n", "0.3483 | \n", "
SD | \n", "158.2664 | \n", "3462560.6654 | \n", "356.0994 | \n", "0.0441 | \n", "0.0429 | \n", "0.0452 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "3130.7528 | \n", "39833455.1804 | \n", "6311.3751 | \n", "0.7621 | \n", "0.5067 | \n", "0.3295 | \n", "
1 | \n", "3104.8369 | \n", "45066079.6663 | \n", "6713.1274 | \n", "0.7380 | \n", "0.5410 | \n", "0.3104 | \n", "
2 | \n", "3315.3420 | \n", "47502769.5127 | \n", "6892.2253 | \n", "0.3986 | \n", "0.6452 | \n", "0.4540 | \n", "
3 | \n", "2869.0078 | \n", "40057346.7729 | \n", "6329.0874 | \n", "0.6655 | \n", "0.6043 | \n", "0.5635 | \n", "
4 | \n", "4039.3881 | \n", "64499878.1756 | \n", "8031.1816 | \n", "0.5203 | \n", "0.6590 | \n", "0.5106 | \n", "
5 | \n", "3324.7419 | \n", "41203145.5554 | \n", "6418.9676 | \n", "0.7350 | \n", "0.4916 | \n", "0.3224 | \n", "
6 | \n", "2579.6933 | \n", "38790767.7084 | \n", "6228.2235 | \n", "0.7361 | \n", "0.3911 | \n", "0.2259 | \n", "
7 | \n", "2727.9530 | \n", "35755628.9950 | \n", "5979.6011 | \n", "0.8034 | \n", "0.4698 | \n", "0.1807 | \n", "
8 | \n", "2863.0106 | \n", "38662493.2325 | \n", "6217.9171 | \n", "0.7503 | \n", "0.5113 | \n", "0.4390 | \n", "
9 | \n", "3207.8434 | \n", "47265363.5462 | \n", "6874.9810 | \n", "0.6956 | \n", "0.5121 | \n", "0.2716 | \n", "
Mean | \n", "3116.2570 | \n", "43863692.8345 | \n", "6599.6687 | \n", "0.6805 | \n", "0.5332 | \n", "0.3608 | \n", "
SD | \n", "388.3229 | \n", "7800317.0820 | \n", "555.0368 | \n", "0.1190 | \n", "0.0781 | \n", "0.1191 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "2689.4264 | \n", "22734130.6123 | \n", "4768.0322 | \n", "0.8642 | \n", "0.4756 | \n", "0.3477 | \n", "
1 | \n", "2850.5489 | \n", "30834672.8607 | \n", "5552.8977 | \n", "0.8207 | \n", "0.4683 | \n", "0.2826 | \n", "
2 | \n", "2767.0499 | \n", "24433673.6238 | \n", "4943.0430 | \n", "0.6906 | \n", "0.5459 | \n", "0.3887 | \n", "
3 | \n", "2842.4438 | \n", "24548531.6439 | \n", "4954.6475 | \n", "0.7950 | \n", "0.5165 | \n", "0.4156 | \n", "
4 | \n", "3020.6002 | \n", "30696946.6676 | \n", "5540.4825 | \n", "0.7717 | \n", "0.5602 | \n", "0.3738 | \n", "
5 | \n", "2818.9442 | \n", "22660137.1436 | \n", "4760.2665 | \n", "0.8542 | \n", "0.3712 | \n", "0.2631 | \n", "
6 | \n", "2617.3220 | \n", "22836756.3973 | \n", "4778.7819 | \n", "0.8446 | \n", "0.3874 | \n", "0.3035 | \n", "
7 | \n", "2684.8101 | \n", "24880599.5740 | \n", "4988.0457 | \n", "0.8632 | \n", "0.4451 | \n", "0.2565 | \n", "
8 | \n", "2334.3161 | \n", "18535034.5531 | \n", "4305.2334 | \n", "0.8803 | \n", "0.4357 | \n", "0.3510 | \n", "
9 | \n", "2820.2249 | \n", "29299167.6551 | \n", "5412.8706 | \n", "0.8113 | \n", "0.5072 | \n", "0.3478 | \n", "
Mean | \n", "2744.5686 | \n", "25145965.0731 | \n", "5000.4301 | \n", "0.8196 | \n", "0.4713 | \n", "0.3330 | \n", "
SD | \n", "173.1694 | \n", "3773482.7721 | \n", "376.3829 | \n", "0.0538 | \n", "0.0599 | \n", "0.0515 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "2088.6098 | \n", "25306132.7724 | \n", "5030.5201 | \n", "0.8489 | \n", "0.4360 | \n", "0.2089 | \n", "
1 | \n", "2694.4500 | \n", "37713226.9165 | \n", "6141.1096 | \n", "0.7807 | \n", "0.5023 | \n", "0.2522 | \n", "
2 | \n", "2580.2904 | \n", "31829320.0726 | \n", "5641.7480 | \n", "0.5970 | \n", "0.5954 | \n", "0.3725 | \n", "
3 | \n", "2026.3867 | \n", "22848511.3127 | \n", "4780.0116 | \n", "0.8092 | \n", "0.3817 | \n", "0.1531 | \n", "
4 | \n", "2783.9969 | \n", "36022333.0588 | \n", "6001.8608 | \n", "0.7321 | \n", "0.5899 | \n", "0.3035 | \n", "
5 | \n", "3304.0820 | \n", "42910088.5364 | \n", "6550.5793 | \n", "0.7240 | \n", "0.4398 | \n", "0.2454 | \n", "
6 | \n", "1691.5091 | \n", "21151389.5978 | \n", "4599.0640 | \n", "0.8561 | \n", "0.3226 | \n", "0.1226 | \n", "
7 | \n", "1941.8231 | \n", "22752869.9142 | \n", "4769.9968 | \n", "0.8749 | \n", "0.3608 | \n", "0.1170 | \n", "
8 | \n", "1842.4044 | \n", "20941293.3847 | \n", "4576.1658 | \n", "0.8647 | \n", "0.3641 | \n", "0.2280 | \n", "
9 | \n", "2618.3033 | \n", "36220824.9672 | \n", "6018.3739 | \n", "0.7667 | \n", "0.4830 | \n", "0.2274 | \n", "
Mean | \n", "2357.1856 | \n", "29769599.0533 | \n", "5410.9430 | \n", "0.7854 | \n", "0.4476 | \n", "0.2231 | \n", "
SD | \n", "487.1035 | \n", "7681159.5886 | \n", "700.9244 | \n", "0.0815 | \n", "0.0900 | \n", "0.0753 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "3588.9893 | \n", "27227488.2418 | \n", "5217.9966 | \n", "0.8374 | \n", "0.4474 | \n", "0.3922 | \n", "
1 | \n", "3940.6663 | \n", "37813639.0591 | \n", "6149.2796 | \n", "0.7801 | \n", "0.4662 | \n", "0.3596 | \n", "
2 | \n", "3269.5714 | \n", "23741983.6366 | \n", "4872.5746 | \n", "0.6994 | \n", "0.5131 | \n", "0.4489 | \n", "
3 | \n", "3244.7876 | \n", "21439268.5774 | \n", "4630.2558 | \n", "0.8210 | \n", "0.4892 | \n", "0.4796 | \n", "
4 | \n", "3830.7883 | \n", "34060098.2718 | \n", "5836.1030 | \n", "0.7467 | \n", "0.4980 | \n", "0.3891 | \n", "
5 | \n", "3401.3759 | \n", "27930731.3360 | \n", "5284.9533 | \n", "0.8203 | \n", "0.3718 | \n", "0.3010 | \n", "
6 | \n", "3336.9082 | \n", "29569717.0842 | \n", "5437.8044 | \n", "0.7988 | \n", "0.4217 | \n", "0.3678 | \n", "
7 | \n", "3917.3172 | \n", "32811159.7555 | \n", "5728.1026 | \n", "0.8196 | \n", "0.4431 | \n", "0.3370 | \n", "
8 | \n", "3581.5944 | \n", "28097351.5923 | \n", "5300.6935 | \n", "0.8185 | \n", "0.4762 | \n", "0.4443 | \n", "
9 | \n", "3799.3702 | \n", "32736398.1844 | \n", "5721.5731 | \n", "0.7891 | \n", "0.5125 | \n", "0.3934 | \n", "
Mean | \n", "3591.1369 | \n", "29542783.5739 | \n", "5417.9336 | \n", "0.7931 | \n", "0.4639 | \n", "0.3913 | \n", "
SD | \n", "255.6282 | \n", "4680386.5098 | \n", "434.4866 | \n", "0.0400 | \n", "0.0421 | \n", "0.0516 | \n", "
MAE | MSE | RMSE | R2 | RMSLE | MAPE | |
---|---|---|---|---|---|---|
0 | \n", "2380.8732 | \n", "18718481.7467 | \n", "4326.4861 | \n", "0.8882 | \n", "0.4086 | \n", "0.2976 | \n", "
1 | \n", "3109.8582 | \n", "31556612.9981 | \n", "5617.5273 | \n", "0.8165 | \n", "0.4530 | \n", "0.2955 | \n", "
2 | \n", "2702.5321 | \n", "20963882.3035 | \n", "4578.6332 | \n", "0.7346 | \n", "0.4929 | \n", "0.3608 | \n", "
3 | \n", "2692.8854 | \n", "18683084.0425 | \n", "4322.3933 | \n", "0.8440 | \n", "0.4368 | \n", "0.3712 | \n", "
4 | \n", "2868.0431 | \n", "26287724.0690 | \n", "5127.1556 | \n", "0.8045 | \n", "0.5203 | \n", "0.2937 | \n", "
5 | \n", "2820.1193 | \n", "19939378.8326 | \n", "4465.3532 | \n", "0.8717 | \n", "0.3493 | \n", "0.2744 | \n", "
6 | \n", "2318.3051 | \n", "19772493.7188 | \n", "4446.6272 | \n", "0.8655 | \n", "0.3429 | \n", "0.2549 | \n", "
7 | \n", "2731.4897 | \n", "24424504.7966 | \n", "4942.1154 | \n", "0.8657 | \n", "0.4218 | \n", "0.2370 | \n", "
8 | \n", "2415.7220 | \n", "18218046.2745 | \n", "4268.2603 | \n", "0.8823 | \n", "0.3987 | \n", "0.3020 | \n", "
9 | \n", "2965.2146 | \n", "27042060.4485 | \n", "5200.1981 | \n", "0.8258 | \n", "0.4810 | \n", "0.3027 | \n", "
Mean | \n", "2700.5043 | \n", "22560626.9231 | \n", "4729.4750 | \n", "0.8399 | \n", "0.4305 | \n", "0.2990 | \n", "
SD | \n", "247.0592 | \n", "4292155.0822 | \n", "438.9686 | \n", "0.0442 | \n", "0.0556 | \n", "0.0394 | \n", "
\n", " | Model | \n", "MAE | \n", "MSE | \n", "RMSE | \n", "R2 | \n", "RMSLE | \n", "MAPE | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "Light Gradient Boosting Machine | \n", "2764.0353 | \n", "2.068683e+07 | \n", "4548.2773 | \n", "0.8552 | \n", "0.5223 | \n", "0.3678 | \n", "
\n", " | age | \n", "bmi | \n", "sex_female | \n", "sex_male | \n", "children_0 | \n", "children_1 | \n", "children_2 | \n", "children_3 | \n", "children_4 | \n", "children_5 | \n", "smoker_no | \n", "smoker_yes | \n", "region_northeast | \n", "region_northwest | \n", "region_southeast | \n", "region_southwest | \n", "charges | \n", "Label | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "49.0 | \n", "42.680 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "9800.88820 | \n", "9363.9665 | \n", "
1 | \n", "32.0 | \n", "37.335 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "4667.60765 | \n", "10393.4936 | \n", "
2 | \n", "27.0 | \n", "31.400 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "34838.87300 | \n", "35628.9933 | \n", "
3 | \n", "35.0 | \n", "24.130 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "5125.21570 | \n", "6926.8267 | \n", "
4 | \n", "60.0 | \n", "25.740 | \n", "0.0 | \n", "1.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "12142.57860 | \n", "17508.2783 | \n", "
\n", " | age | \n", "sex | \n", "bmi | \n", "children | \n", "smoker | \n", "region | \n", "Label | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "19 | \n", "female | \n", "27.900 | \n", "0 | \n", "yes | \n", "southwest | \n", "16884.9240 | \n", "
1 | \n", "18 | \n", "male | \n", "33.770 | \n", "1 | \n", "no | \n", "southeast | \n", "1725.5523 | \n", "
2 | \n", "28 | \n", "male | \n", "33.000 | \n", "3 | \n", "no | \n", "southeast | \n", "5138.2567 | \n", "
3 | \n", "33 | \n", "male | \n", "22.705 | \n", "0 | \n", "no | \n", "northwest | \n", "21984.4706 | \n", "
4 | \n", "32 | \n", "male | \n", "28.880 | \n", "0 | \n", "no | \n", "northwest | \n", "3866.8552 | \n", "
Pipeline(memory=None,\n", " steps=[('dtypes',\n", " DataTypes_Auto_infer(categorical_features=[],\n", " display_types=True, features_todrop=[],\n", " ml_usecase='regression',\n", " numerical_features=[], target='charges',\n", " time_features=[])),\n", " ('imputer',\n", " Simple_Imputer(categorical_strategy='not_available',\n", " numeric_strategy='mean',\n", " target_variable=None)),\n", " ('new_levels1',\n", " New_Catagorical_Levels...\n", " ('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\n", " ('P_transform', Empty()), ('pt_target', Empty()),\n", " ('binn', Empty()), ('rem_outliers', Empty()),\n", " ('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\n", " ('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\n", " ('feature_select', Empty()), ('fix_multi', Empty()),\n", " ('dfs', Empty()), ('pca', Empty())],\n", " verbose=False)
DataTypes_Auto_infer(ml_usecase='regression', target='charges')
Simple_Imputer(categorical_strategy='not_available', numeric_strategy='mean',\n", " target_variable=None)
New_Catagorical_Levels_in_TestData(replacement_strategy='least frequent',\n", " target='charges')
Empty()
Empty()
Empty()
Empty()
New_Catagorical_Levels_in_TestData(replacement_strategy='least frequent',\n", " target='charges')
Make_Time_Features(list_of_features=None)
Empty()
Empty()
Empty()
Empty()
Empty()
Empty()
Empty()
Empty()
Dummify(target='charges')
Empty()
Clean_Colum_Names()
Empty()
Empty()
Empty()
Empty()
\n", " | age | \n", "bmi | \n", "sex_female | \n", "sex_male | \n", "children_0 | \n", "children_1 | \n", "children_2 | \n", "children_3 | \n", "children_4 | \n", "children_5 | \n", "smoker_no | \n", "smoker_yes | \n", "region_northeast | \n", "region_northwest | \n", "region_southeast | \n", "region_southwest | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
300 | \n", "36.0 | \n", "27.55 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "
904 | \n", "60.0 | \n", "35.10 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "
670 | \n", "30.0 | \n", "31.57 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
617 | \n", "49.0 | \n", "25.60 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "
373 | \n", "26.0 | \n", "32.90 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "
\n", " | run_id | \n", "experiment_id | \n", "status | \n", "artifact_uri | \n", "start_time | \n", "end_time | \n", "metrics.MAE | \n", "metrics.R2 | \n", "metrics.RMSE | \n", "metrics.RMSLE | \n", "... | \n", "tags.mlflow.runName | \n", "tags.USI | \n", "tags.Size KB | \n", "tags.URI | \n", "tags.Source | \n", "tags.Final | \n", "tags.Run ID | \n", "tags.mlflow.user | \n", "tags.Run Time | \n", "tags.mlflow.source.name | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "3ceaff2c0be247bca703bf99030e7385 | \n", "1 | \n", "FINISHED | \n", "file:///C:/Users/moezs/pycaret-demo-td/mlruns/... | \n", "2020-07-29 13:56:33.597000+00:00 | \n", "2020-07-29 13:56:34.863000+00:00 | \n", "2357.185600 | \n", "0.785400 | \n", "5410.943000 | \n", "0.447600 | \n", "... | \n", "AdaBoost Regressor | \n", "d354 | \n", "766.67 | \n", "c5ed107e | \n", "finalize_model | \n", "True | \n", "3ceaff2c0be247bca703bf99030e7385 | \n", "moezs | \n", "0.09 | \n", "C:\\Users\\moezs\\Anaconda3\\envs\\pycaret-nightly-... | \n", "
1 | \n", "a7f177d89880493e9947f619d39e6c64 | \n", "1 | \n", "FINISHED | \n", "file:///C:/Users/moezs/pycaret-demo-td/mlruns/... | \n", "2020-07-29 13:55:02.104000+00:00 | \n", "2020-07-29 13:55:02.455000+00:00 | \n", "2852.132294 | \n", "0.822325 | \n", "5038.547940 | \n", "0.489646 | \n", "... | \n", "CatBoost Regressor | \n", "d354 | \n", "1045.05 | \n", "e91b9451 | \n", "compare_models | \n", "None | \n", "a7f177d89880493e9947f619d39e6c64 | \n", "moezs | \n", "17.33 | \n", "C:\\Users\\moezs\\Anaconda3\\envs\\pycaret-nightly-... | \n", "
2 | \n", "9bceee47fc3f425e9e82259f03381d6d | \n", "1 | \n", "FINISHED | \n", "file:///C:/Users/moezs/pycaret-demo-td/mlruns/... | \n", "2020-07-29 13:54:44.359000+00:00 | \n", "2020-07-29 13:54:44.762000+00:00 | \n", "3018.989510 | \n", "0.819169 | \n", "5049.849249 | \n", "0.553369 | \n", "... | \n", "Light Gradient Boosting Machine | \n", "d354 | \n", "270.94 | \n", "e91b9451 | \n", "compare_models | \n", "None | \n", "9bceee47fc3f425e9e82259f03381d6d | \n", "moezs | \n", "1.79 | \n", "C:\\Users\\moezs\\Anaconda3\\envs\\pycaret-nightly-... | \n", "
3 | \n", "7b7973e270194411aee1c67b49a258e8 | \n", "1 | \n", "FINISHED | \n", "file:///C:/Users/moezs/pycaret-demo-td/mlruns/... | \n", "2020-07-29 13:54:42.088000+00:00 | \n", "2020-07-29 13:54:42.557000+00:00 | \n", "3257.276696 | \n", "0.777365 | \n", "5610.507927 | \n", "0.572295 | \n", "... | \n", "Extreme Gradient Boosting | \n", "d354 | \n", "294.45 | \n", "e91b9451 | \n", "compare_models | \n", "None | \n", "7b7973e270194411aee1c67b49a258e8 | \n", "moezs | \n", "1.46 | \n", "C:\\Users\\moezs\\Anaconda3\\envs\\pycaret-nightly-... | \n", "
4 | \n", "8d91720808a74f0ca95a1beafa02af52 | \n", "1 | \n", "FINISHED | \n", "file:///C:/Users/moezs/pycaret-demo-td/mlruns/... | \n", "2020-07-29 13:54:40.283000+00:00 | \n", "2020-07-29 13:54:40.615000+00:00 | \n", "2671.592651 | \n", "0.839292 | \n", "4794.603702 | \n", "0.443938 | \n", "... | \n", "Gradient Boosting Regressor | \n", "d354 | \n", "181.67 | \n", "e91b9451 | \n", "compare_models | \n", "None | \n", "8d91720808a74f0ca95a1beafa02af52 | \n", "moezs | \n", "1.22 | \n", "C:\\Users\\moezs\\Anaconda3\\envs\\pycaret-nightly-... | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
61 | \n", "ca41825ba51049cca2980db4b14f0803 | \n", "1 | \n", "FINISHED | \n", "file:///C:/Users/moezs/pycaret-demo-td/mlruns/... | \n", "2020-07-29 13:47:33.304000+00:00 | \n", "2020-07-29 13:47:33.463000+00:00 | \n", "6399.470189 | \n", "0.502055 | \n", "8506.281322 | \n", "0.678918 | \n", "... | \n", "Elastic Net | \n", "e640 | \n", "12.16 | \n", "46e4ab7a | \n", "compare_models | \n", "None | \n", "ca41825ba51049cca2980db4b14f0803 | \n", "moezs | \n", "0.11 | \n", "C:\\Users\\moezs\\Anaconda3\\envs\\pycaret-nightly-... | \n", "
62 | \n", "220347e92d6d4e15a0689f1996f65be1 | \n", "1 | \n", "FINISHED | \n", "file:///C:/Users/moezs/pycaret-demo-td/mlruns/... | \n", "2020-07-29 13:47:33.064000+00:00 | \n", "2020-07-29 13:47:33.186000+00:00 | \n", "4339.609325 | \n", "0.734330 | \n", "6196.489057 | \n", "0.634846 | \n", "... | \n", "Ridge Regression | \n", "e640 | \n", "11.99 | \n", "46e4ab7a | \n", "compare_models | \n", "None | \n", "220347e92d6d4e15a0689f1996f65be1 | \n", "moezs | \n", "0.1 | \n", "C:\\Users\\moezs\\Anaconda3\\envs\\pycaret-nightly-... | \n", "
63 | \n", "92449063af5b4b7f889b49049567e4fb | \n", "1 | \n", "FINISHED | \n", "file:///C:/Users/moezs/pycaret-demo-td/mlruns/... | \n", "2020-07-29 13:47:32.842000+00:00 | \n", "2020-07-29 13:47:32.958000+00:00 | \n", "4332.632737 | \n", "0.734306 | \n", "6196.607372 | \n", "0.640365 | \n", "... | \n", "Lasso Regression | \n", "e640 | \n", "12.16 | \n", "46e4ab7a | \n", "compare_models | \n", "None | \n", "92449063af5b4b7f889b49049567e4fb | \n", "moezs | \n", "0.11 | \n", "C:\\Users\\moezs\\Anaconda3\\envs\\pycaret-nightly-... | \n", "
64 | \n", "6c6d422e6ab84f6489075246e84b5b88 | \n", "1 | \n", "FINISHED | \n", "file:///C:/Users/moezs/pycaret-demo-td/mlruns/... | \n", "2020-07-29 13:47:32.314000+00:00 | \n", "2020-07-29 13:47:32.729000+00:00 | \n", "4332.765843 | \n", "0.734268 | \n", "6197.084227 | \n", "0.636878 | \n", "... | \n", "Linear Regression | \n", "e640 | \n", "12.16 | \n", "46e4ab7a | \n", "compare_models | \n", "None | \n", "6c6d422e6ab84f6489075246e84b5b88 | \n", "moezs | \n", "0.12 | \n", "C:\\Users\\moezs\\Anaconda3\\envs\\pycaret-nightly-... | \n", "
65 | \n", "076cde0252cb41c9a57a55908c8f3aa3 | \n", "1 | \n", "FINISHED | \n", "file:///C:/Users/moezs/pycaret-demo-td/mlruns/... | \n", "2020-07-29 13:47:20.601000+00:00 | \n", "2020-07-29 13:47:20.806000+00:00 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "... | \n", "Session Initialized e640 | \n", "e640 | \n", "11.44 | \n", "ab172480 | \n", "setup | \n", "None | \n", "076cde0252cb41c9a57a55908c8f3aa3 | \n", "moezs | \n", "4.53 | \n", "C:\\Users\\moezs\\Anaconda3\\envs\\pycaret-nightly-... | \n", "
66 rows × 201 columns
\n", "