{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# PyCaret 2 Clustering Example\n", "This notebook was created using PyCaret 2.0. Last updated: 28-07-2020" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "pycaret-nightly-0.39\n" ] } ], "source": [ "# check version\n", "from pycaret.utils import version\n", "version()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 1. Loading Dataset" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
Country Name199519961997199819992000200120022003...2005200620072008200920102011201220132014
0Arab World2.0048682.0146022.0713092.1777122.3310002.3335962.5887512.5402382.450415...2.1342812.1330382.1668722.1012332.8300672.4896312.5395702.7112622.8954273.073161
1Caribbean small states2.8015182.8566842.9971572.9894512.7678582.8267522.6799692.8886932.740593...2.6295802.6509002.7906652.8229133.4086513.2640643.0876533.3143033.3184323.260012
2Central Europe and the Baltics4.6785284.7532094.6045744.4999884.6790824.5397114.6662724.9001965.100249...4.9708614.8414504.8090575.0547855.3949215.2843805.0962125.0413175.0292665.017717
3Early-demographic dividend2.2031642.1566322.2273112.3641002.4543942.4505552.5270812.3477022.363263...2.3373472.3698842.3852512.4051262.7012602.5071312.4954912.4973402.5867012.665603
4East Asia & Pacific4.4290904.2031524.2443514.4539844.6269204.6888494.6847904.6135374.635098...4.5662154.3671464.2973944.4348484.8652414.7758174.8717274.8668694.6432214.571448
\n", "

5 rows × 21 columns

\n", "
" ], "text/plain": [ " Country Name 1995 1996 1997 1998 \\\n", "0 Arab World 2.004868 2.014602 2.071309 2.177712 \n", "1 Caribbean small states 2.801518 2.856684 2.997157 2.989451 \n", "2 Central Europe and the Baltics 4.678528 4.753209 4.604574 4.499988 \n", "3 Early-demographic dividend 2.203164 2.156632 2.227311 2.364100 \n", "4 East Asia & Pacific 4.429090 4.203152 4.244351 4.453984 \n", "\n", " 1999 2000 2001 2002 2003 ... 2005 2006 \\\n", "0 2.331000 2.333596 2.588751 2.540238 2.450415 ... 2.134281 2.133038 \n", "1 2.767858 2.826752 2.679969 2.888693 2.740593 ... 2.629580 2.650900 \n", "2 4.679082 4.539711 4.666272 4.900196 5.100249 ... 4.970861 4.841450 \n", "3 2.454394 2.450555 2.527081 2.347702 2.363263 ... 2.337347 2.369884 \n", "4 4.626920 4.688849 4.684790 4.613537 4.635098 ... 4.566215 4.367146 \n", "\n", " 2007 2008 2009 2010 2011 2012 2013 \\\n", "0 2.166872 2.101233 2.830067 2.489631 2.539570 2.711262 2.895427 \n", "1 2.790665 2.822913 3.408651 3.264064 3.087653 3.314303 3.318432 \n", "2 4.809057 5.054785 5.394921 5.284380 5.096212 5.041317 5.029266 \n", "3 2.385251 2.405126 2.701260 2.507131 2.495491 2.497340 2.586701 \n", "4 4.297394 4.434848 4.865241 4.775817 4.871727 4.866869 4.643221 \n", "\n", " 2014 \n", "0 3.073161 \n", "1 3.260012 \n", "2 5.017717 \n", "3 2.665603 \n", "4 4.571448 \n", "\n", "[5 rows x 21 columns]" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "from pycaret.datasets import get_data\n", "data = get_data('public_health')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 2. 
Initialize Setup" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Setup Succesfully Completed!\n" ] }, { "data": { "text/html": [ "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
Description Value
0session_id 123
1Original Data (224, 21)
2Missing Values False
3Numeric Features 20
4Categorical Features 1
5Ordinal Features False
6High Cardinality Features False
7Transformed Data (224, 20)
8Numeric Imputer mean
9Categorical Imputer constant
10Normalize False
11Normalize Method None
12Transformation False
13Transformation Method None
14PCA False
15PCA Method None
16PCA components None
17Ignore Low Variance False
18Combine Rare Levels False
19Rare Level Threshold None
20Numeric Binning False
21Remove Multicollinearity False
22Multicollinearity Threshold None
23Group Features False
" ], "text/plain": [ "" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "from pycaret.clustering import *\n", "clu1 = setup(data, ignore_features = ['Country Name'], session_id=123, log_experiment=True, log_plots = True, experiment_name='health1')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 3. Create Model" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
NameReference
ID
kmeansK-Means Clusteringsklearn.cluster.KMeans
apAffinity Propagationsklearn.cluster.AffinityPropagation
meanshiftMean shift Clusteringsklearn.cluster.MeanShift
scSpectral Clusteringsklearn.cluster.SpectralClustering
hclustAgglomerative Clusteringsklearn.cluster.AgglomerativeClustering
dbscanDensity-Based Spatial Clusteringsklearn.cluster.DBSCAN
opticsOPTICS Clusteringsklearn.cluster.OPTICS
birchBirch Clusteringsklearn.cluster.Birch
kmodesK-Modes Clusteringgit/nicodv/kmodes
\n", "
" ], "text/plain": [ " Name \\\n", "ID \n", "kmeans K-Means Clustering \n", "ap Affinity Propagation \n", "meanshift Mean shift Clustering \n", "sc Spectral Clustering \n", "hclust Agglomerative Clustering \n", "dbscan Density-Based Spatial Clustering \n", "optics OPTICS Clustering \n", "birch Birch Clustering \n", "kmodes K-Modes Clustering \n", "\n", " Reference \n", "ID \n", "kmeans sklearn.cluster.KMeans \n", "ap sklearn.cluster.AffinityPropagation \n", "meanshift sklearn.cluster.MeanShift \n", "sc sklearn.cluster.SpectralClustering \n", "hclust sklearn.cluster.AgglomerativeClustering \n", "dbscan sklearn.cluster.DBSCAN \n", "optics sklearn.cluster.OPTICS \n", "birch sklearn.cluster.Birch \n", "kmodes git/nicodv/kmodes " ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "models()" ] }, { "cell_type": "code", "execution_count": 5, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
Metric
Silhouette0.4335
Calinski-Harabasz322.9575
Davies-Bouldin0.7471
\n", "
" ], "text/plain": [ " Metric\n", "Silhouette 0.4335\n", "Calinski-Harabasz 322.9575\n", "Davies-Bouldin 0.7471" ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "kmeans = create_model('kmeans', num_clusters = 4)" ] }, { "cell_type": "code", "execution_count": 6, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
Metric
Silhouette-0.3632
Calinski-Harabasz1.2468
Davies-Bouldin1.2297
\n", "
" ], "text/plain": [ " Metric\n", "Silhouette -0.3632\n", "Calinski-Harabasz 1.2468\n", "Davies-Bouldin 1.2297" ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "kmodes = create_model('kmodes', num_clusters = 4)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 4. Assign Labels" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
Country Name199519961997199819992000200120022003...200620072008200920102011201220132014Cluster
0Arab World2.0048682.0146022.0713092.1777122.3310002.3335962.5887512.5402382.450415...2.1330382.1668722.1012332.8300672.4896312.5395702.7112622.8954273.073161Cluster 2
1Caribbean small states2.8015182.8566842.9971572.9894512.7678582.8267522.6799692.8886932.740593...2.6509002.7906652.8229133.4086513.2640643.0876533.3143033.3184323.260012Cluster 2
2Central Europe and the Baltics4.6785284.7532094.6045744.4999884.6790824.5397114.6662724.9001965.100249...4.8414504.8090575.0547855.3949215.2843805.0962125.0413175.0292665.017717Cluster 0
3Early-demographic dividend2.2031642.1566322.2273112.3641002.4543942.4505552.5270812.3477022.363263...2.3698842.3852512.4051262.7012602.5071312.4954912.4973402.5867012.665603Cluster 2
4East Asia & Pacific4.4290904.2031524.2443514.4539844.6269204.6888494.6847904.6135374.635098...4.3671464.2973944.4348484.8652414.7758174.8717274.8668694.6432214.571448Cluster 0
\n", "

5 rows × 22 columns

\n", "
" ], "text/plain": [ " Country Name 1995 1996 1997 1998 \\\n", "0 Arab World 2.004868 2.014602 2.071309 2.177712 \n", "1 Caribbean small states 2.801518 2.856684 2.997157 2.989451 \n", "2 Central Europe and the Baltics 4.678528 4.753209 4.604574 4.499988 \n", "3 Early-demographic dividend 2.203164 2.156632 2.227311 2.364100 \n", "4 East Asia & Pacific 4.429090 4.203152 4.244351 4.453984 \n", "\n", " 1999 2000 2001 2002 2003 ... 2006 2007 \\\n", "0 2.331000 2.333596 2.588751 2.540238 2.450415 ... 2.133038 2.166872 \n", "1 2.767858 2.826752 2.679969 2.888693 2.740593 ... 2.650900 2.790665 \n", "2 4.679082 4.539711 4.666272 4.900196 5.100249 ... 4.841450 4.809057 \n", "3 2.454394 2.450555 2.527081 2.347702 2.363263 ... 2.369884 2.385251 \n", "4 4.626920 4.688849 4.684790 4.613537 4.635098 ... 4.367146 4.297394 \n", "\n", " 2008 2009 2010 2011 2012 2013 2014 \\\n", "0 2.101233 2.830067 2.489631 2.539570 2.711262 2.895427 3.073161 \n", "1 2.822913 3.408651 3.264064 3.087653 3.314303 3.318432 3.260012 \n", "2 5.054785 5.394921 5.284380 5.096212 5.041317 5.029266 5.017717 \n", "3 2.405126 2.701260 2.507131 2.495491 2.497340 2.586701 2.665603 \n", "4 4.434848 4.865241 4.775817 4.871727 4.866869 4.643221 4.571448 \n", "\n", " Cluster \n", "0 Cluster 2 \n", "1 Cluster 2 \n", "2 Cluster 0 \n", "3 Cluster 2 \n", "4 Cluster 0 \n", "\n", "[5 rows x 22 columns]" ] }, "execution_count": 7, "metadata": {}, "output_type": "execute_result" } ], "source": [ "kmeans_results = assign_model(kmeans)\n", "kmeans_results.head()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 5. 
Analyze Model" ] }, { "cell_type": "code", "execution_count": 8, "metadata": {}, "outputs": [ { "data": { "text/html": [ " \n", " " ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "application/vnd.plotly.v1+json": { "config": { "plotlyServerURL": "https://plot.ly" }, "data": [ { "customdata": [ [ "Honduras" ], [ "Dominica" ], [ "Djibouti" ], [ "Samoa" ], [ "San Marino" ], [ "Sao Tome and Principe" ], [ "Colombia" ], [ "Chile" ], [ "Cabo Verde" ], [ "Solomon Islands" ], [ "Bulgaria" ], [ "South Africa" ], [ "Brazil" ], [ "Botswana" ], [ "Bolivia" ], [ "Bhutan" ], [ "Belarus" ], [ "Barbados" ], [ "St. Lucia" ], [ "St. Vincent and the Grenadines" ], [ "Russian Federation" ], [ "Suriname" ], [ "Romania" ], [ "Estonia" ], [ "Moldova" ], [ "Malawi" ], [ "Monaco" ], [ "Macedonia, FYR" ], [ "Lithuania" ], [ "Lebanon" ], [ "Latvia" ], [ "Montenegro" ], [ "Mozambique" ], [ "Namibia" ], [ "Jordan" ], [ "Israel" ], [ "Nicaragua" ], [ "Hungary" ], [ "Guyana" ], [ "Grenada" ], [ "Panama" ], [ "Papua New Guinea" ], [ "Poland" ], [ "El Salvador" ], [ "Argentina" ], [ "Seychelles" ], [ "Swaziland" ], [ "Small states" ], [ "Tonga" ], [ "Vanuatu" ], [ "Pacific island small states" ], [ "Other small states" ], [ "Tunisia" ], [ "East Asia & Pacific" ], [ "Turkey" ], [ "Ukraine" ], [ "Antigua and Barbuda" ], [ "Europe & Central Asia (IDA & IBRD countries)" ], [ "Latin America & the Caribbean (IDA & IBRD countries)" ], [ "Latin America & Caribbean (excluding high income)" ], [ "Latin America & Caribbean" ], [ "Europe & Central Asia (excluding high income)" ], [ "Thailand" ], [ "Uruguay" ], [ "Central Europe and the Baltics" ], [ "Algeria" ], [ "Andorra" ] ], "hovertemplate": "Cluster=Cluster 0
PCA1=%{x}
PCA2=%{y}
Feature=%{customdata[0]}", "legendgroup": "Cluster 0", "marker": { "color": "#636efa", "opacity": 0.5, "symbol": "circle" }, "mode": "markers", "name": "Cluster 0", "orientation": "v", "showlegend": true, "textposition": "top center", "type": "scatter", "x": [ 0.0523809767042203, -0.6963165842730611, 3.4963629024504157, 2.239179963842626, 2.996541555817924, -1.982879767134111, 5.269249366144288, -2.982481930004971, -0.5993207982455239, 6.323109784117417, 0.9043237858037494, -0.41674848743597237, -1.8325711391061783, -1.686965814851076, -0.8536612634039066, 2.8846255739114053, 3.0973104640228657, 0.5412716246977549, -1.7848088812854825, -0.5138111571569077, -0.36390899901084006, 0.040582767506344375, 0.7748426086098928, 3.7119153029666663, 4.882710147013893, 3.4211056709118535, -2.011887424842368, 4.811797590024579, 3.3977115784363083, -1.0594868777708515, -0.15053431117056518, 5.521664440212993, -1.5422464279154837, 2.475123168426273, 6.3793604633161785, 4.232365223943223, -0.4234591695205206, 6.877428452111309, 2.7628508172347273, -2.710078590714615, 6.182900164693898, 1.7357732814693132, 2.8915650781047106, 0.4067357117267071, 1.6549886134245433, -0.6367154259911892, 3.477841724858415, -2.8033488749931306, 0.688224693343187, -2.679774235079104, 2.521124354529939, -2.678082879662622, -2.260400608016421, 3.7321855099220653, -0.4374089529823035, 0.6817178664409335, -2.7904247938703306, 0.18827377624908267, -2.334515940063102, -2.0788610562518857, -2.0866140147954266, -0.5707423499700737, -0.13082493573547338, 3.753184859247307, 5.19653204627169, -2.5644440390142282, 4.883437593508746 ], "xaxis": "x", "y": [ -1.0061914536857364, 1.5305671961061875, -3.0016842207799743, -1.6875356484840207, -0.2740310411662722, 1.7913403986410694, 1.3359849927496932, 0.16091627846989195, 2.2543298469994255, -1.5474141205241485, 0.5730460663408711, 0.11355576223380467, -0.4294276179163997, -0.45382741503654317, -0.5170665696550727, 3.8566195969433834, 3.1486955568002464, 
-0.5683861330013134, 0.03129894274702836, -0.06757513689428422, 1.657514000735274, 4.7341680137885565, -1.2385442803297109, 1.264358496837327, 0.25926155597166634, -6.448804007521148, -0.4154591228405269, 3.387338823334593, 0.9531860986338618, 2.9931221367653293, 0.8003393682777394, 4.121262186928553, 1.9141130390493308, 0.5760168892285199, 0.7145199934098242, 1.70042370692386, -1.0957750164154723, 2.506866811798524, 2.1863935441044426, 1.9233874084159046, 0.6587191354538705, 1.377242221635593, 0.24184140169870277, -0.5631591457580744, 3.973969905401959, 3.142590570320148, -5.131259458682053, 1.503215156474529, 0.23043470667369545, -0.9892378763665283, 0.519385857240113, 1.7809406740110842, -0.8410240643570489, 0.9928267617964195, -1.8311715877970052, 1.1596543184112722, -0.6084592632583561, 0.7463734591250084, 0.13891010566730913, 0.12929841063543973, 0.09429419110350006, 0.6820820860708171, -3.706588405460558, -4.1531049826228665, 0.7126585487039374, -2.1296685616125792, -2.433941599042843 ], "yaxis": "y" }, { "customdata": [ [ "Micronesia, Fed. Sts." ], [ "Kiribati" ], [ "Finland" ], [ "France" ], [ "United Kingdom" ], [ "Germany" ], [ "Malta" ], [ "Greece" ], [ "Portugal" ], [ "Austria" ], [ "European Union" ], [ "Japan" ], [ "Australia" ], [ "Norway" ], [ "Netherlands" ], [ "United States" ], [ "Iceland" ], [ "Italy" ], [ "High income" ], [ "New Zealand" ], [ "Palau" ], [ "World" ], [ "Sweden" ], [ "Cuba" ], [ "Switzerland" ], [ "Slovak Republic" ], [ "Post-demographic dividend" ], [ "Serbia" ], [ "Spain" ], [ "Lesotho" ], [ "Europe & Central Asia" ], [ "Maldives" ], [ "Costa Rica" ], [ "Canada" ], [ "OECD members" ], [ "Croatia" ], [ "Ireland" ], [ "North America" ], [ "Czech Republic" ], [ "Denmark" ], [ "Euro area" ], [ "Belgium" ], [ "Slovenia" ], [ "Bosnia and Herzegovina" ], [ "Luxembourg" ] ], "hovertemplate": "Cluster=Cluster 1
PCA1=%{x}
PCA2=%{y}
Feature=%{customdata[0]}", "legendgroup": "Cluster 1", "marker": { "color": "#EF553B", "opacity": 0.5, "symbol": "circle" }, "mode": "markers", "name": "Cluster 1", "orientation": "v", "showlegend": true, "textposition": "top center", "type": "scatter", "x": [ 28.0262695538832, 23.420927418009597, 10.726724560722625, 20.274410375468314, 12.929593082081045, 19.694842954903077, 7.314091778152733, 7.186477299903722, 11.14119297927542, 18.367344502907944, 14.943239114650703, 13.813253198680279, 8.675223471375858, 16.671662050148086, 14.383614043780405, 14.058971232804135, 15.946916758968193, 11.481683009232073, 13.138218186033123, 15.482183362753911, 13.858864478915562, 8.629457309687261, 18.38721009205912, 16.80945641164693, 11.69398831763859, 7.34823407837088, 13.808128624207797, 7.64716251857974, 10.043412321500618, 7.060532218142876, 13.234086657329984, 7.472880926088071, 10.217763125731786, 13.95454071375664, 13.114383027129241, 10.475304935117329, 7.171364571949278, 14.032324057252538, 10.210283019050978, 20.07095230754882, 15.823770054445614, 14.600979477284383, 11.318080992622432, 7.014345778510733, 10.746653539988584 ], "xaxis": "x", "y": [ -6.041878648963877, 1.823268170516312, -1.030749695397637, 0.5893161257926888, -2.2661386247236397, 1.2426452203194973, -1.6944069348771362, -1.361353560999246, -0.3178429143929311, 0.21312339635189195, -0.41168663466966343, -2.6865792296916515, -0.3696795752168184, 0.444650157035873, -6.075816075638619, -2.128293361440676, 2.1692216402280793, -1.2206793438921009, -1.1393786999588782, -4.743207341003983, 3.4424525494613616, 0.39461364528283294, -2.2006955984502494, -6.478083184227868, -1.83393087984684, 0.6291036683252442, -1.4098865373330882, -1.462348094961733, -0.9687378170947273, -6.859660089106432, 0.26416370258018984, -4.919417342361275, -1.1138186475250478, -0.6679680569801177, -1.2698155947760223, 0.35135324468989126, -0.25585213517749955, -2.0055644357724742, 0.9972888247732347, -2.057592902176683, 
-0.144709221609351, -1.8679602899905683, 0.4399174439131799, -3.5188569549087685, 0.6763558407018944 ], "yaxis": "y" }, { "customdata": [ [ "Vietnam" ], [ "Morocco" ], [ "Nepal" ], [ "Myanmar" ], [ "Venezuela, RB" ], [ "Mongolia" ], [ "Uzbekistan" ], [ "United Arab Emirates" ], [ "Nigeria" ], [ "Sudan" ], [ "St. Kitts and Nevis" ], [ "Sri Lanka" ], [ "Syrian Arab Republic" ], [ "Tajikistan" ], [ "Tanzania" ], [ "Togo" ], [ "Singapore" ], [ "Sierra Leone" ], [ "Mexico" ], [ "Niger" ], [ "Senegal" ], [ "Trinidad and Tobago" ], [ "Rwanda" ], [ "Turkmenistan" ], [ "Uganda" ], [ "Qatar" ], [ "Philippines" ], [ "Peru" ], [ "Paraguay" ], [ "Pakistan" ], [ "Oman" ], [ "Saudi Arabia" ], [ "Mauritius" ], [ "Arab World" ], [ "Chad" ], [ "Upper middle income" ], [ "Albania" ], [ "Angola" ], [ "Armenia" ], [ "Azerbaijan" ], [ "Bahamas, The" ], [ "Bahrain" ], [ "Bangladesh" ], [ "Belize" ], [ "Benin" ], [ "Brunei Darussalam" ], [ "Burkina Faso" ], [ "Burundi" ], [ "Cambodia" ], [ "Cameroon" ], [ "Sub-Saharan Africa (IDA & IBRD countries)" ], [ "Sub-Saharan Africa (excluding high income)" ], [ "Sub-Saharan Africa" ], [ "South Asia (IDA & IBRD)" ], [ "Caribbean small states" ], [ "Early-demographic dividend" ], [ "East Asia & Pacific (excluding high income)" ], [ "East Asia & Pacific (IDA & IBRD countries)" ], [ "Heavily indebted poor countries (HIPC)" ], [ "Late-demographic dividend" ], [ "Least developed countries: UN classification" ], [ "Central African Republic" ], [ "Low & middle income" ], [ "Lower middle income" ], [ "Middle East & North Africa" ], [ "Middle East & North Africa (excluding high income)" ], [ "Middle East & North Africa (IDA & IBRD countries)" ], [ "Middle income" ], [ "Pre-demographic dividend" ], [ "South Asia" ], [ "Low income" ], [ "Mauritania" ], [ "Zambia" ], [ "Comoros" ], [ "Yemen, Rep." ], [ "India" ], [ "Indonesia" ], [ "Iran, Islamic Rep." ], [ "Jamaica" ], [ "Kazakhstan" ], [ "Kenya" ], [ "Korea, Rep." 
], [ "Kuwait" ], [ "Kyrgyz Republic" ], [ "Lao PDR" ], [ "Libya" ], [ "Madagascar" ], [ "Malaysia" ], [ "Mali" ], [ "China" ], [ "Guinea-Bissau" ], [ "Haiti" ], [ "Guatemala" ], [ "Congo, Dem. Rep." ], [ "Congo, Rep." ], [ "Cote d'Ivoire" ], [ "Cyprus" ], [ "Dominican Republic" ], [ "Ecuador" ], [ "Egypt, Arab Rep." ], [ "Equatorial Guinea" ], [ "Eritrea" ], [ "Ethiopia" ], [ "Fiji" ], [ "Gabon" ], [ "Gambia, The" ], [ "Georgia" ], [ "Ghana" ], [ "Guinea" ] ], "hovertemplate": "Cluster=Cluster 2
PCA1=%{x}
PCA2=%{y}
Feature=%{customdata[0]}", "legendgroup": "Cluster 2", "marker": { "color": "#00cc96", "opacity": 0.5, "symbol": "circle" }, "mode": "markers", "name": "Cluster 2", "orientation": "v", "showlegend": true, "textposition": "top center", "type": "scatter", "x": [ -6.838127133689372, -9.484297119000681, -7.481534537789983, -15.11526667768679, -8.0099704622005, -3.709945822543768, -4.343995899371722, -7.527412152427506, -12.093503451711781, -10.187893573210124, -5.982304037394747, -9.033280310482066, -8.34993440852866, -10.7401637209542, -6.704510490114223, -8.637772998311174, -10.783145859486595, -6.071121988048263, -4.862787780405474, -6.897017132517401, -7.128722124865843, -5.193398208285049, -4.536767858980432, -7.808119101950003, -7.410104286952265, -7.287596977267267, -10.375982305040118, -4.701430209018233, -3.3258792623976925, -13.274173398510674, -5.7830515182741244, -5.28060194247648, -7.183762362692117, -5.978111640505859, -8.739668478685987, -3.5565463908430774, -5.665968771045835, -6.1758384619265, -8.8877011054299, -11.990190347513366, -3.4727360186098393, -5.140448924477463, -12.279275148006182, -3.6782325952668047, -6.759047335826221, -5.553747628790428, -3.5927102273363105, -3.9114615341007193, -9.835625771928305, -11.816550848843821, -5.726460400774469, -5.733959228379499, -5.726460400774469, -11.717744407779506, -3.5335523602755807, -5.874889989411106, -7.338891894395104, -7.338891894395102, -6.779112802141312, -3.4865834565786367, -8.473369637629364, -8.328928193317836, -5.029770548401174, -10.12208829043547, -4.754617117667594, -5.6689371743232835, -5.6689371743232835, -5.002990850532889, -8.803685060464211, -11.717744407779506, -6.935487657597175, -8.209723823671501, -3.718335935066663, -7.131632386667641, -9.08405838904044, -11.64996360056128, -12.53819234803707, -6.29493372530749, -4.2763390860391794, -6.102007952138874, -7.505875796444623, -3.842269509289177, -5.756711635031171, -3.482951191502168, -11.157062106263886, -6.851591572318085, 
-6.318006421470661, -7.845046648174215, -4.999397273875959, -7.085967768499033, -10.52832969892298, -9.33543422069262, -7.2795343806145585, -12.749904411139479, -8.321722617418871, -9.491378675550758, -4.343442425602127, -7.780851195519921, -7.790551996098864, -7.622396289866976, -6.338709691007325, -9.859076847688465, -5.804870493017629, -4.139888379414401, -9.64411915861642, -5.068430173668127, -10.269095235769905, -5.329248830030671, -10.94554042621343 ], "xaxis": "x", "y": [ -2.1054224181312517, -0.6743398818959013, -0.837773061289016, -0.028339201058388965, 0.8228560527689587, 2.5255249894814966, 1.289877638426681, -0.36883114624597113, 0.31707827709695074, -1.5314700249093545, 2.123293254630933, 0.9368375328552409, 1.9279965762758615, -0.35646060776214494, -1.212219561328002, -0.4796246484431998, 0.3453398942374639, 2.053568828482675, -0.6462077405756084, -0.8646847381552383, -0.4874435073466264, -0.14709501047151036, -0.5039192162486804, 3.6314570197613825, -0.09849466670467585, 1.7017615075616381, 0.6894459850578996, 0.41004174217124434, -1.7654684443955149, 0.1519555139871271, 1.8771059208222196, -0.005353811348649069, 0.269614037976079, 0.060087273871189145, 2.0067347015121886, 0.014294049568387578, -0.2991488213101728, 1.0483999724431234, 0.2338035573351899, 0.6302439716252003, -0.4216974744697445, 1.0191811139862552, 0.9292942917451482, -1.553841067125939, 0.2722175266084948, 2.0371987618496568, -1.1581411492570501, -4.799628678285951, 1.320370034410966, 0.4203891767923587, 0.855292406191082, 0.8502496554360927, 0.855292406191082, 0.39968228249469306, 0.4273170989236, 0.5811594934368999, -0.9944962782369446, -0.9944962782369445, -0.5068844372590348, 0.03421941894983672, -0.09237404974594536, 0.5463133582843177, 0.055592760544055694, 0.47506045021065135, 0.4487598516474099, -0.3826301018191773, -0.3826301018191773, 0.06441920890858716, -0.17604580883604506, 0.39968228249469306, -0.5257808006280743, 2.0017941573755866, 2.117893316914127, 
1.2418292146067682, 1.9725459159480585, 0.4387840994705089, 0.15993643922619083, -0.4299112429353996, 0.818304173500739, 1.4083207333161525, -0.6464163056969573, -2.5218613664014, 1.9781672804329198, -1.3346870062550664, 1.9136966118668464, -0.8158920238856169, 0.8693110544295612, 0.02881027663560581, 1.4976155459698757, -1.0585595028827899, 1.029264975053775, 2.009609502540951, -0.010123131376214865, -1.7875193250832506, -1.176103741966348, 0.8968873316434841, -1.129575189688764, -0.7418307711572959, -1.9995631693860632, 0.8432791724505591, -0.054473415667810145, 1.4370530974830713, -1.6067288163268219, 0.8117649007612818, -0.9218388760417181, -4.230259164337702, -0.2889516151239778, -1.758457647299846, -1.145121519851282 ], "yaxis": "y" }, { "customdata": [ [ "Nauru" ], [ "Tuvalu" ], [ "Marshall Islands" ] ], "hovertemplate": "Cluster=Cluster 3
PCA1=%{x}
PCA2=%{y}
Feature=%{customdata[0]}", "legendgroup": "Cluster 3", "marker": { "color": "#ab63fa", "opacity": 0.5, "symbol": "circle" }, "mode": "markers", "name": "Cluster 3", "orientation": "v", "showlegend": true, "textposition": "top center", "type": "scatter", "x": [ 32.54294615578061, 49.13614546484315, 55.908067724687456 ], "xaxis": "x", "y": [ 14.525514048370503, -4.779342617786482, 11.19015475718291 ], "yaxis": "y" } ], "layout": { "height": 600, "legend": { "title": { "text": "Cluster" }, "tracegroupgap": 0 }, "margin": { "t": 60 }, "plot_bgcolor": "rgb(240,240,240)", "template": { "data": { "bar": [ { "error_x": { "color": "#2a3f5f" }, "error_y": { "color": "#2a3f5f" }, "marker": { "line": { "color": "#E5ECF6", "width": 0.5 } }, "type": "bar" } ], "barpolar": [ { "marker": { "line": { "color": "#E5ECF6", "width": 0.5 } }, "type": "barpolar" } ], "carpet": [ { "aaxis": { "endlinecolor": "#2a3f5f", "gridcolor": "white", "linecolor": "white", "minorgridcolor": "white", "startlinecolor": "#2a3f5f" }, "baxis": { "endlinecolor": "#2a3f5f", "gridcolor": "white", "linecolor": "white", "minorgridcolor": "white", "startlinecolor": "#2a3f5f" }, "type": "carpet" } ], "choropleth": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "choropleth" } ], "contour": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "contour" } ], "contourcarpet": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "contourcarpet" } ], "heatmap": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 
0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "heatmap" } ], "heatmapgl": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "heatmapgl" } ], "histogram": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "histogram" } ], "histogram2d": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "histogram2d" } ], "histogram2dcontour": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "histogram2dcontour" } ], "mesh3d": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "mesh3d" } ], "parcoords": [ { "line": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "parcoords" } ], "pie": [ { "automargin": true, "type": "pie" } ], "scatter": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatter" } ], "scatter3d": [ { "line": { "colorbar": { 
"outlinewidth": 0, "ticks": "" } }, "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatter3d" } ], "scattercarpet": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattercarpet" } ], "scattergeo": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattergeo" } ], "scattergl": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattergl" } ], "scattermapbox": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattermapbox" } ], "scatterpolar": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterpolar" } ], "scatterpolargl": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterpolargl" } ], "scatterternary": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterternary" } ], "surface": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "surface" } ], "table": [ { "cells": { "fill": { "color": "#EBF0F8" }, "line": { "color": "white" } }, "header": { "fill": { "color": "#C8D4E3" }, "line": { "color": "white" } }, "type": "table" } ] }, "layout": { "annotationdefaults": { "arrowcolor": "#2a3f5f", "arrowhead": 0, "arrowwidth": 1 }, "coloraxis": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "colorscale": { "diverging": [ [ 0, "#8e0152" ], [ 0.1, "#c51b7d" ], [ 0.2, "#de77ae" ], [ 0.3, "#f1b6da" ], [ 0.4, "#fde0ef" ], [ 0.5, "#f7f7f7" ], [ 0.6, "#e6f5d0" ], [ 0.7, "#b8e186" ], [ 0.8, "#7fbc41" ], [ 0.9, "#4d9221" ], [ 1, "#276419" ] ], "sequential": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 
0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "sequentialminus": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ] }, "colorway": [ "#636efa", "#EF553B", "#00cc96", "#ab63fa", "#FFA15A", "#19d3f3", "#FF6692", "#B6E880", "#FF97FF", "#FECB52" ], "font": { "color": "#2a3f5f" }, "geo": { "bgcolor": "white", "lakecolor": "white", "landcolor": "#E5ECF6", "showlakes": true, "showland": true, "subunitcolor": "white" }, "hoverlabel": { "align": "left" }, "hovermode": "closest", "mapbox": { "style": "light" }, "paper_bgcolor": "white", "plot_bgcolor": "#E5ECF6", "polar": { "angularaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" }, "bgcolor": "#E5ECF6", "radialaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" } }, "scene": { "xaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" }, "yaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" }, "zaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" } }, "shapedefaults": { "line": { "color": "#2a3f5f" } }, "ternary": { "aaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" }, "baxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" }, "bgcolor": "#E5ECF6", "caxis": { "gridcolor": 
"white", "linecolor": "white", "ticks": "" } }, "title": { "x": 0.05 }, "xaxis": { "automargin": true, "gridcolor": "white", "linecolor": "white", "ticks": "", "title": { "standoff": 15 }, "zerolinecolor": "white", "zerolinewidth": 2 }, "yaxis": { "automargin": true, "gridcolor": "white", "linecolor": "white", "ticks": "", "title": { "standoff": 15 }, "zerolinecolor": "white", "zerolinewidth": 2 } } }, "title": { "text": "2D Cluster PCA Plot" }, "xaxis": { "anchor": "y", "domain": [ 0, 1 ], "title": { "text": "PCA1" } }, "yaxis": { "anchor": "x", "domain": [ 0, 1 ], "title": { "text": "PCA2" } } } }, "text/html": [ "
\n", " \n", " \n", "
\n", " \n", "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "plot_model(kmeans)" ] }, { "cell_type": "code", "execution_count": 9, "metadata": {}, "outputs": [ { "data": { "text/html": [ " \n", " " ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "application/vnd.plotly.v1+json": { "config": { "plotlyServerURL": "https://plot.ly" }, "data": [ { "hovertemplate": "Cluster=Cluster 0
PCA1=%{x}
PCA2=%{y}
Label=%{text}", "legendgroup": "Cluster 0", "marker": { "color": "#636efa", "opacity": 0.5, "symbol": "circle" }, "mode": "markers+text", "name": "Cluster 0", "orientation": "v", "showlegend": true, "text": [ "Honduras", "Dominica", "Djibouti", "Samoa", "San Marino", "Sao Tome and Principe", "Colombia", "Chile", "Cabo Verde", "Solomon Islands", "Bulgaria", "South Africa", "Brazil", "Botswana", "Bolivia", "Bhutan", "Belarus", "Barbados", "St. Lucia", "St. Vincent and the Grenadines", "Russian Federation", "Suriname", "Romania", "Estonia", "Moldova", "Malawi", "Monaco", "Macedonia, FYR", "Lithuania", "Lebanon", "Latvia", "Montenegro", "Mozambique", "Namibia", "Jordan", "Israel", "Nicaragua", "Hungary", "Guyana", "Grenada", "Panama", "Papua New Guinea", "Poland", "El Salvador", "Argentina", "Seychelles", "Swaziland", "Small states", "Tonga", "Vanuatu", "Pacific island small states", "Other small states", "Tunisia", "East Asia & Pacific", "Turkey", "Ukraine", "Antigua and Barbuda", "Europe & Central Asia (IDA & IBRD countries)", "Latin America & the Caribbean (IDA & IBRD countries)", "Latin America & Caribbean (excluding high income)", "Latin America & Caribbean", "Europe & Central Asia (excluding high income)", "Thailand", "Uruguay", "Central Europe and the Baltics", "Algeria", "Andorra" ], "textposition": "top center", "type": "scatter", "x": [ 0.0523809767042203, -0.6963165842730611, 3.4963629024504157, 2.239179963842626, 2.996541555817924, -1.982879767134111, 5.269249366144288, -2.982481930004971, -0.5993207982455239, 6.323109784117417, 0.9043237858037494, -0.41674848743597237, -1.8325711391061783, -1.686965814851076, -0.8536612634039066, 2.8846255739114053, 3.0973104640228657, 0.5412716246977549, -1.7848088812854825, -0.5138111571569077, -0.36390899901084006, 0.040582767506344375, 0.7748426086098928, 3.7119153029666663, 4.882710147013893, 3.4211056709118535, -2.011887424842368, 4.811797590024579, 3.3977115784363083, -1.0594868777708515, -0.15053431117056518, 
5.521664440212993, -1.5422464279154837, 2.475123168426273, 6.3793604633161785, 4.232365223943223, -0.4234591695205206, 6.877428452111309, 2.7628508172347273, -2.710078590714615, 6.182900164693898, 1.7357732814693132, 2.8915650781047106, 0.4067357117267071, 1.6549886134245433, -0.6367154259911892, 3.477841724858415, -2.8033488749931306, 0.688224693343187, -2.679774235079104, 2.521124354529939, -2.678082879662622, -2.260400608016421, 3.7321855099220653, -0.4374089529823035, 0.6817178664409335, -2.7904247938703306, 0.18827377624908267, -2.334515940063102, -2.0788610562518857, -2.0866140147954266, -0.5707423499700737, -0.13082493573547338, 3.753184859247307, 5.19653204627169, -2.5644440390142282, 4.883437593508746 ], "xaxis": "x", "y": [ -1.0061914536857364, 1.5305671961061875, -3.0016842207799743, -1.6875356484840207, -0.2740310411662722, 1.7913403986410694, 1.3359849927496932, 0.16091627846989195, 2.2543298469994255, -1.5474141205241485, 0.5730460663408711, 0.11355576223380467, -0.4294276179163997, -0.45382741503654317, -0.5170665696550727, 3.8566195969433834, 3.1486955568002464, -0.5683861330013134, 0.03129894274702836, -0.06757513689428422, 1.657514000735274, 4.7341680137885565, -1.2385442803297109, 1.264358496837327, 0.25926155597166634, -6.448804007521148, -0.4154591228405269, 3.387338823334593, 0.9531860986338618, 2.9931221367653293, 0.8003393682777394, 4.121262186928553, 1.9141130390493308, 0.5760168892285199, 0.7145199934098242, 1.70042370692386, -1.0957750164154723, 2.506866811798524, 2.1863935441044426, 1.9233874084159046, 0.6587191354538705, 1.377242221635593, 0.24184140169870277, -0.5631591457580744, 3.973969905401959, 3.142590570320148, -5.131259458682053, 1.503215156474529, 0.23043470667369545, -0.9892378763665283, 0.519385857240113, 1.7809406740110842, -0.8410240643570489, 0.9928267617964195, -1.8311715877970052, 1.1596543184112722, -0.6084592632583561, 0.7463734591250084, 0.13891010566730913, 0.12929841063543973, 0.09429419110350006, 
0.6820820860708171, -3.706588405460558, -4.1531049826228665, 0.7126585487039374, -2.1296685616125792, -2.433941599042843 ], "yaxis": "y" }, { "hovertemplate": "Cluster=Cluster 1
PCA1=%{x}
PCA2=%{y}
Label=%{text}", "legendgroup": "Cluster 1", "marker": { "color": "#EF553B", "opacity": 0.5, "symbol": "circle" }, "mode": "markers+text", "name": "Cluster 1", "orientation": "v", "showlegend": true, "text": [ "Micronesia, Fed. Sts.", "Kiribati", "Finland", "France", "United Kingdom", "Germany", "Malta", "Greece", "Portugal", "Austria", "European Union", "Japan", "Australia", "Norway", "Netherlands", "United States", "Iceland", "Italy", "High income", "New Zealand", "Palau", "World", "Sweden", "Cuba", "Switzerland", "Slovak Republic", "Post-demographic dividend", "Serbia", "Spain", "Lesotho", "Europe & Central Asia", "Maldives", "Costa Rica", "Canada", "OECD members", "Croatia", "Ireland", "North America", "Czech Republic", "Denmark", "Euro area", "Belgium", "Slovenia", "Bosnia and Herzegovina", "Luxembourg" ], "textposition": "top center", "type": "scatter", "x": [ 28.0262695538832, 23.420927418009597, 10.726724560722625, 20.274410375468314, 12.929593082081045, 19.694842954903077, 7.314091778152733, 7.186477299903722, 11.14119297927542, 18.367344502907944, 14.943239114650703, 13.813253198680279, 8.675223471375858, 16.671662050148086, 14.383614043780405, 14.058971232804135, 15.946916758968193, 11.481683009232073, 13.138218186033123, 15.482183362753911, 13.858864478915562, 8.629457309687261, 18.38721009205912, 16.80945641164693, 11.69398831763859, 7.34823407837088, 13.808128624207797, 7.64716251857974, 10.043412321500618, 7.060532218142876, 13.234086657329984, 7.472880926088071, 10.217763125731786, 13.95454071375664, 13.114383027129241, 10.475304935117329, 7.171364571949278, 14.032324057252538, 10.210283019050978, 20.07095230754882, 15.823770054445614, 14.600979477284383, 11.318080992622432, 7.014345778510733, 10.746653539988584 ], "xaxis": "x", "y": [ -6.041878648963877, 1.823268170516312, -1.030749695397637, 0.5893161257926888, -2.2661386247236397, 1.2426452203194973, -1.6944069348771362, -1.361353560999246, -0.3178429143929311, 0.21312339635189195, 
-0.41168663466966343, -2.6865792296916515, -0.3696795752168184, 0.444650157035873, -6.075816075638619, -2.128293361440676, 2.1692216402280793, -1.2206793438921009, -1.1393786999588782, -4.743207341003983, 3.4424525494613616, 0.39461364528283294, -2.2006955984502494, -6.478083184227868, -1.83393087984684, 0.6291036683252442, -1.4098865373330882, -1.462348094961733, -0.9687378170947273, -6.859660089106432, 0.26416370258018984, -4.919417342361275, -1.1138186475250478, -0.6679680569801177, -1.2698155947760223, 0.35135324468989126, -0.25585213517749955, -2.0055644357724742, 0.9972888247732347, -2.057592902176683, -0.144709221609351, -1.8679602899905683, 0.4399174439131799, -3.5188569549087685, 0.6763558407018944 ], "yaxis": "y" }, { "hovertemplate": "Cluster=Cluster 2
PCA1=%{x}
PCA2=%{y}
Label=%{text}", "legendgroup": "Cluster 2", "marker": { "color": "#00cc96", "opacity": 0.5, "symbol": "circle" }, "mode": "markers+text", "name": "Cluster 2", "orientation": "v", "showlegend": true, "text": [ "Vietnam", "Morocco", "Nepal", "Myanmar", "Venezuela, RB", "Mongolia", "Uzbekistan", "United Arab Emirates", "Nigeria", "Sudan", "St. Kitts and Nevis", "Sri Lanka", "Syrian Arab Republic", "Tajikistan", "Tanzania", "Togo", "Singapore", "Sierra Leone", "Mexico", "Niger", "Senegal", "Trinidad and Tobago", "Rwanda", "Turkmenistan", "Uganda", "Qatar", "Philippines", "Peru", "Paraguay", "Pakistan", "Oman", "Saudi Arabia", "Mauritius", "Arab World", "Chad", "Upper middle income", "Albania", "Angola", "Armenia", "Azerbaijan", "Bahamas, The", "Bahrain", "Bangladesh", "Belize", "Benin", "Brunei Darussalam", "Burkina Faso", "Burundi", "Cambodia", "Cameroon", "Sub-Saharan Africa (IDA & IBRD countries)", "Sub-Saharan Africa (excluding high income)", "Sub-Saharan Africa", "South Asia (IDA & IBRD)", "Caribbean small states", "Early-demographic dividend", "East Asia & Pacific (excluding high income)", "East Asia & Pacific (IDA & IBRD countries)", "Heavily indebted poor countries (HIPC)", "Late-demographic dividend", "Least developed countries: UN classification", "Central African Republic", "Low & middle income", "Lower middle income", "Middle East & North Africa", "Middle East & North Africa (excluding high income)", "Middle East & North Africa (IDA & IBRD countries)", "Middle income", "Pre-demographic dividend", "South Asia", "Low income", "Mauritania", "Zambia", "Comoros", "Yemen, Rep.", "India", "Indonesia", "Iran, Islamic Rep.", "Jamaica", "Kazakhstan", "Kenya", "Korea, Rep.", "Kuwait", "Kyrgyz Republic", "Lao PDR", "Libya", "Madagascar", "Malaysia", "Mali", "China", "Guinea-Bissau", "Haiti", "Guatemala", "Congo, Dem. 
Rep.", "Congo, Rep.", "Cote d'Ivoire", "Cyprus", "Dominican Republic", "Ecuador", "Egypt, Arab Rep.", "Equatorial Guinea", "Eritrea", "Ethiopia", "Fiji", "Gabon", "Gambia, The", "Georgia", "Ghana", "Guinea" ], "textposition": "top center", "type": "scatter", "x": [ -6.838127133689372, -9.484297119000681, -7.481534537789983, -15.11526667768679, -8.0099704622005, -3.709945822543768, -4.343995899371722, -7.527412152427506, -12.093503451711781, -10.187893573210124, -5.982304037394747, -9.033280310482066, -8.34993440852866, -10.7401637209542, -6.704510490114223, -8.637772998311174, -10.783145859486595, -6.071121988048263, -4.862787780405474, -6.897017132517401, -7.128722124865843, -5.193398208285049, -4.536767858980432, -7.808119101950003, -7.410104286952265, -7.287596977267267, -10.375982305040118, -4.701430209018233, -3.3258792623976925, -13.274173398510674, -5.7830515182741244, -5.28060194247648, -7.183762362692117, -5.978111640505859, -8.739668478685987, -3.5565463908430774, -5.665968771045835, -6.1758384619265, -8.8877011054299, -11.990190347513366, -3.4727360186098393, -5.140448924477463, -12.279275148006182, -3.6782325952668047, -6.759047335826221, -5.553747628790428, -3.5927102273363105, -3.9114615341007193, -9.835625771928305, -11.816550848843821, -5.726460400774469, -5.733959228379499, -5.726460400774469, -11.717744407779506, -3.5335523602755807, -5.874889989411106, -7.338891894395104, -7.338891894395102, -6.779112802141312, -3.4865834565786367, -8.473369637629364, -8.328928193317836, -5.029770548401174, -10.12208829043547, -4.754617117667594, -5.6689371743232835, -5.6689371743232835, -5.002990850532889, -8.803685060464211, -11.717744407779506, -6.935487657597175, -8.209723823671501, -3.718335935066663, -7.131632386667641, -9.08405838904044, -11.64996360056128, -12.53819234803707, -6.29493372530749, -4.2763390860391794, -6.102007952138874, -7.505875796444623, -3.842269509289177, -5.756711635031171, -3.482951191502168, -11.157062106263886, -6.851591572318085, 
-6.318006421470661, -7.845046648174215, -4.999397273875959, -7.085967768499033, -10.52832969892298, -9.33543422069262, -7.2795343806145585, -12.749904411139479, -8.321722617418871, -9.491378675550758, -4.343442425602127, -7.780851195519921, -7.790551996098864, -7.622396289866976, -6.338709691007325, -9.859076847688465, -5.804870493017629, -4.139888379414401, -9.64411915861642, -5.068430173668127, -10.269095235769905, -5.329248830030671, -10.94554042621343 ], "xaxis": "x", "y": [ -2.1054224181312517, -0.6743398818959013, -0.837773061289016, -0.028339201058388965, 0.8228560527689587, 2.5255249894814966, 1.289877638426681, -0.36883114624597113, 0.31707827709695074, -1.5314700249093545, 2.123293254630933, 0.9368375328552409, 1.9279965762758615, -0.35646060776214494, -1.212219561328002, -0.4796246484431998, 0.3453398942374639, 2.053568828482675, -0.6462077405756084, -0.8646847381552383, -0.4874435073466264, -0.14709501047151036, -0.5039192162486804, 3.6314570197613825, -0.09849466670467585, 1.7017615075616381, 0.6894459850578996, 0.41004174217124434, -1.7654684443955149, 0.1519555139871271, 1.8771059208222196, -0.005353811348649069, 0.269614037976079, 0.060087273871189145, 2.0067347015121886, 0.014294049568387578, -0.2991488213101728, 1.0483999724431234, 0.2338035573351899, 0.6302439716252003, -0.4216974744697445, 1.0191811139862552, 0.9292942917451482, -1.553841067125939, 0.2722175266084948, 2.0371987618496568, -1.1581411492570501, -4.799628678285951, 1.320370034410966, 0.4203891767923587, 0.855292406191082, 0.8502496554360927, 0.855292406191082, 0.39968228249469306, 0.4273170989236, 0.5811594934368999, -0.9944962782369446, -0.9944962782369445, -0.5068844372590348, 0.03421941894983672, -0.09237404974594536, 0.5463133582843177, 0.055592760544055694, 0.47506045021065135, 0.4487598516474099, -0.3826301018191773, -0.3826301018191773, 0.06441920890858716, -0.17604580883604506, 0.39968228249469306, -0.5257808006280743, 2.0017941573755866, 2.117893316914127, 
1.2418292146067682, 1.9725459159480585, 0.4387840994705089, 0.15993643922619083, -0.4299112429353996, 0.818304173500739, 1.4083207333161525, -0.6464163056969573, -2.5218613664014, 1.9781672804329198, -1.3346870062550664, 1.9136966118668464, -0.8158920238856169, 0.8693110544295612, 0.02881027663560581, 1.4976155459698757, -1.0585595028827899, 1.029264975053775, 2.009609502540951, -0.010123131376214865, -1.7875193250832506, -1.176103741966348, 0.8968873316434841, -1.129575189688764, -0.7418307711572959, -1.9995631693860632, 0.8432791724505591, -0.054473415667810145, 1.4370530974830713, -1.6067288163268219, 0.8117649007612818, -0.9218388760417181, -4.230259164337702, -0.2889516151239778, -1.758457647299846, -1.145121519851282 ], "yaxis": "y" }, { "hovertemplate": "Cluster=Cluster 3
PCA1=%{x}
PCA2=%{y}
Label=%{text}", "legendgroup": "Cluster 3", "marker": { "color": "#ab63fa", "opacity": 0.5, "symbol": "circle" }, "mode": "markers+text", "name": "Cluster 3", "orientation": "v", "showlegend": true, "text": [ "Nauru", "Tuvalu", "Marshall Islands" ], "textposition": "top center", "type": "scatter", "x": [ 32.54294615578061, 49.13614546484315, 55.908067724687456 ], "xaxis": "x", "y": [ 14.525514048370503, -4.779342617786482, 11.19015475718291 ], "yaxis": "y" } ], "layout": { "height": 600, "legend": { "title": { "text": "Cluster" }, "tracegroupgap": 0 }, "margin": { "t": 60 }, "plot_bgcolor": "rgb(240,240,240)", "template": { "data": { "bar": [ { "error_x": { "color": "#2a3f5f" }, "error_y": { "color": "#2a3f5f" }, "marker": { "line": { "color": "#E5ECF6", "width": 0.5 } }, "type": "bar" } ], "barpolar": [ { "marker": { "line": { "color": "#E5ECF6", "width": 0.5 } }, "type": "barpolar" } ], "carpet": [ { "aaxis": { "endlinecolor": "#2a3f5f", "gridcolor": "white", "linecolor": "white", "minorgridcolor": "white", "startlinecolor": "#2a3f5f" }, "baxis": { "endlinecolor": "#2a3f5f", "gridcolor": "white", "linecolor": "white", "minorgridcolor": "white", "startlinecolor": "#2a3f5f" }, "type": "carpet" } ], "choropleth": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "choropleth" } ], "contour": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "contour" } ], "contourcarpet": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "contourcarpet" } ], "heatmap": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 
0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "heatmap" } ], "heatmapgl": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "heatmapgl" } ], "histogram": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "histogram" } ], "histogram2d": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "histogram2d" } ], "histogram2dcontour": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "histogram2dcontour" } ], "mesh3d": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "mesh3d" } ], "parcoords": [ { "line": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "parcoords" } ], "pie": [ { "automargin": true, "type": "pie" } ], "scatter": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatter" } ], "scatter3d": [ 
{ "line": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatter3d" } ], "scattercarpet": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattercarpet" } ], "scattergeo": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattergeo" } ], "scattergl": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattergl" } ], "scattermapbox": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattermapbox" } ], "scatterpolar": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterpolar" } ], "scatterpolargl": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterpolargl" } ], "scatterternary": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterternary" } ], "surface": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "surface" } ], "table": [ { "cells": { "fill": { "color": "#EBF0F8" }, "line": { "color": "white" } }, "header": { "fill": { "color": "#C8D4E3" }, "line": { "color": "white" } }, "type": "table" } ] }, "layout": { "annotationdefaults": { "arrowcolor": "#2a3f5f", "arrowhead": 0, "arrowwidth": 1 }, "coloraxis": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "colorscale": { "diverging": [ [ 0, "#8e0152" ], [ 0.1, "#c51b7d" ], [ 0.2, "#de77ae" ], [ 0.3, "#f1b6da" ], [ 0.4, "#fde0ef" ], [ 0.5, "#f7f7f7" ], [ 0.6, "#e6f5d0" ], [ 0.7, "#b8e186" ], [ 0.8, "#7fbc41" ], [ 0.9, "#4d9221" ], [ 1, "#276419" ] ], "sequential": [ [ 0, "#0d0887" ], [ 0.1111111111111111, 
"#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "sequentialminus": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ] }, "colorway": [ "#636efa", "#EF553B", "#00cc96", "#ab63fa", "#FFA15A", "#19d3f3", "#FF6692", "#B6E880", "#FF97FF", "#FECB52" ], "font": { "color": "#2a3f5f" }, "geo": { "bgcolor": "white", "lakecolor": "white", "landcolor": "#E5ECF6", "showlakes": true, "showland": true, "subunitcolor": "white" }, "hoverlabel": { "align": "left" }, "hovermode": "closest", "mapbox": { "style": "light" }, "paper_bgcolor": "white", "plot_bgcolor": "#E5ECF6", "polar": { "angularaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" }, "bgcolor": "#E5ECF6", "radialaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" } }, "scene": { "xaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" }, "yaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" }, "zaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" } }, "shapedefaults": { "line": { "color": "#2a3f5f" } }, "ternary": { "aaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" }, "baxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" }, "bgcolor": "#E5ECF6", "caxis": { 
"gridcolor": "white", "linecolor": "white", "ticks": "" } }, "title": { "x": 0.05 }, "xaxis": { "automargin": true, "gridcolor": "white", "linecolor": "white", "ticks": "", "title": { "standoff": 15 }, "zerolinecolor": "white", "zerolinewidth": 2 }, "yaxis": { "automargin": true, "gridcolor": "white", "linecolor": "white", "ticks": "", "title": { "standoff": 15 }, "zerolinecolor": "white", "zerolinewidth": 2 } } }, "title": { "text": "2D Cluster PCA Plot" }, "xaxis": { "anchor": "y", "domain": [ 0, 1 ], "title": { "text": "PCA1" } }, "yaxis": { "anchor": "x", "domain": [ 0, 1 ], "title": { "text": "PCA2" } } } }, "text/html": [ "
\n", " \n", " \n", "
\n", " \n", "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "plot_model(kmeans, feature = 'Country Name', label=True)" ] }, { "cell_type": "code", "execution_count": 10, "metadata": {}, "outputs": [ { "data": { "text/html": [ " \n", " " ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "application/vnd.plotly.v1+json": { "config": { "plotlyServerURL": "https://plot.ly" }, "data": [ { "customdata": [ [ "Honduras" ], [ "Dominica" ], [ "Djibouti" ], [ "Samoa" ], [ "San Marino" ], [ "Sao Tome and Principe" ], [ "Colombia" ], [ "Chile" ], [ "Cabo Verde" ], [ "Solomon Islands" ], [ "Bulgaria" ], [ "South Africa" ], [ "Brazil" ], [ "Botswana" ], [ "Bolivia" ], [ "Bhutan" ], [ "Belarus" ], [ "Barbados" ], [ "St. Lucia" ], [ "St. Vincent and the Grenadines" ], [ "Russian Federation" ], [ "Suriname" ], [ "Romania" ], [ "Estonia" ], [ "Moldova" ], [ "Malawi" ], [ "Monaco" ], [ "Macedonia, FYR" ], [ "Lithuania" ], [ "Lebanon" ], [ "Latvia" ], [ "Montenegro" ], [ "Mozambique" ], [ "Namibia" ], [ "Jordan" ], [ "Israel" ], [ "Nicaragua" ], [ "Hungary" ], [ "Guyana" ], [ "Grenada" ], [ "Panama" ], [ "Papua New Guinea" ], [ "Poland" ], [ "El Salvador" ], [ "Argentina" ], [ "Seychelles" ], [ "Swaziland" ], [ "Small states" ], [ "Tonga" ], [ "Vanuatu" ], [ "Pacific island small states" ], [ "Other small states" ], [ "Tunisia" ], [ "East Asia & Pacific" ], [ "Turkey" ], [ "Ukraine" ], [ "Antigua and Barbuda" ], [ "Europe & Central Asia (IDA & IBRD countries)" ], [ "Latin America & the Caribbean (IDA & IBRD countries)" ], [ "Latin America & Caribbean (excluding high income)" ], [ "Latin America & Caribbean" ], [ "Europe & Central Asia (excluding high income)" ], [ "Thailand" ], [ "Uruguay" ], [ "Central Europe and the Baltics" ], [ "Algeria" ], [ "Andorra" ] ], "hovertemplate": "Cluster=Cluster 0
0=%{x}
1=%{y}
2=%{z}
Feature=%{customdata[0]}", "legendgroup": "Cluster 0", "marker": { "color": "#636efa", "opacity": 0.7, "symbol": "circle" }, "mode": "markers", "name": "Cluster 0", "scene": "scene", "showlegend": true, "type": "scatter3d", "x": [ -126.78446960449219, -32.37543487548828, -19.36821746826172, -18.89223289489746, 144.3787078857422, -73.21328735351562, -42.71407699584961, -27.84712028503418, 74.90287780761719, 11.832152366638184, -87.12774658203125, 133.77809143066406, -90.86527252197266, -109.42573547363281, -88.20365142822266, -76.91995239257812, -91.02154541015625, -32.2028694152832, -27.2868595123291, -57.80535125732422, -108.08625030517578, -80.39252471923828, -107.40230560302734, -133.89035034179688, -124.98924255371094, 8.11201000213623, -66.80313873291016, -78.32198333740234, -114.07943725585938, -2.4837732315063477, -116.26299285888672, -40.849178314208984, -66.57929992675781, -14.147893905639648, -37.86670684814453, -122.67259979248047, -52.52400588989258, -70.49372100830078, -101.6419448852539, -31.854501724243164, 22.719388961791992, -106.13804626464844, -65.93650817871094, -70.15404510498047, -66.82675170898438, 7.206932067871094, -45.80060577392578, -44.320133209228516, -124.49557495117188, -91.65505981445312, -43.67847442626953, -27.566049575805664, -50.18693161010742, -70.46929168701172, -45.12035369873047, -40.63631820678711, -59.46231460571289, 104.69760131835938, 102.19699096679688, -79.22418975830078, -79.26667785644531, -88.33302307128906, -9.479289054870605, -42.430625915527344, 154.92051696777344, -60.429378509521484, 82.88695526123047 ], "y": [ 43.15277099609375, -10.89283275604248, -24.421171188354492, -92.1946029663086, 129.49444580078125, 41.3981819152832, -23.111337661743164, 44.28285217285156, -116.93305206298828, -15.740466117858887, -21.407833099365234, -48.601226806640625, 45.268795013427734, 74.9503173828125, 33.87964630126953, -37.77450942993164, -60.04612350463867, -47.31461715698242, 19.260692596435547, 24.68792724609375, 
-110.743408203125, -52.72629928588867, -3.811255693435669, -72.65250396728516, -44.520538330078125, -30.29142951965332, 19.481428146362305, -32.62969970703125, -39.35870361328125, -23.85220718383789, 20.2210750579834, -140.74462890625, 7.367926120758057, -64.85199737548828, -86.46775817871094, -39.187164306640625, -4.034049987792969, -87.078857421875, -74.50845336914062, -10.110224723815918, -60.68466567993164, -2.7893710136413574, -45.02962112426758, 2.2084994316101074, -71.01929473876953, -18.65491485595703, -85.18721008300781, -30.196495056152344, 21.637052536010742, 29.188814163208008, -21.467952728271484, -10.298230171203613, 37.224632263183594, 72.28972625732422, 19.837854385375977, -39.084259033203125, 64.85214233398438, -100.50811004638672, -79.002685546875, 52.88836669921875, 21.779090881347656, 2.4989407062530518, 23.948307037353516, -19.20369529724121, 57.39501953125, 62.94207000732422, -137.23312377929688 ], "z": [ 29.807958602905273, -25.67173957824707, 124.5315170288086, -40.57310485839844, -34.887657165527344, -89.9435806274414, 83.33155822753906, -17.19514274597168, 12.633121490478516, 96.05663299560547, 16.357215881347656, -13.559488296508789, 48.78775405883789, -8.385662078857422, -34.03363800048828, -27.457378387451172, 6.517147064208984, -44.499725341796875, 18.380664825439453, -9.462685585021973, 38.46765899658203, -66.57456970214844, 46.36784744262695, 14.267641067504883, -92.97856140136719, 149.65750122070312, 61.128910064697266, 80.01795959472656, -23.70490074157715, 0.8011439442634583, -3.233625888824463, -68.75605010986328, -83.13336181640625, -13.865184783935547, 9.562644004821777, 14.643394470214844, 7.726006031036377, 26.00888442993164, -27.922414779663086, -113.27445220947266, 7.004746913909912, -73.03219604492188, 37.03928756713867, -40.196353912353516, -25.442922592163086, 32.239994049072266, -72.35624694824219, -86.91000366210938, -46.444637298583984, 87.101806640625, 41.75047302246094, -72.31778717041016, 36.9173469543457, 
-45.84349822998047, 112.41606903076172, 3.3442492485046387, 52.71244812011719, 34.306846618652344, -16.136449813842773, 13.833440780639648, 25.74953842163086, -8.760519981384277, 121.27063751220703, 155.79559326171875, 1.765377163887024, 97.37370300292969, 71.88475799560547 ] }, { "customdata": [ [ "Micronesia, Fed. Sts." ], [ "Kiribati" ], [ "Finland" ], [ "France" ], [ "United Kingdom" ], [ "Germany" ], [ "Malta" ], [ "Greece" ], [ "Portugal" ], [ "Austria" ], [ "European Union" ], [ "Japan" ], [ "Australia" ], [ "Norway" ], [ "Netherlands" ], [ "United States" ], [ "Iceland" ], [ "Italy" ], [ "High income" ], [ "New Zealand" ], [ "Palau" ], [ "World" ], [ "Sweden" ], [ "Cuba" ], [ "Switzerland" ], [ "Slovak Republic" ], [ "Post-demographic dividend" ], [ "Serbia" ], [ "Spain" ], [ "Lesotho" ], [ "Europe & Central Asia" ], [ "Maldives" ], [ "Costa Rica" ], [ "Canada" ], [ "OECD members" ], [ "Croatia" ], [ "Ireland" ], [ "North America" ], [ "Czech Republic" ], [ "Denmark" ], [ "Euro area" ], [ "Belgium" ], [ "Slovenia" ], [ "Bosnia and Herzegovina" ], [ "Luxembourg" ] ], "hovertemplate": "Cluster=Cluster 1
0=%{x}
1=%{y}
2=%{z}
Feature=%{customdata[0]}", "legendgroup": "Cluster 1", "marker": { "color": "#EF553B", "opacity": 0.7, "symbol": "circle" }, "mode": "markers", "name": "Cluster 1", "scene": "scene", "showlegend": true, "type": "scatter3d", "x": [ -88.11402130126953, -77.82678985595703, -3.2598507404327393, 69.15101623535156, 62.150917053222656, -62.651519775390625, 39.013641357421875, -165.47891235351562, 28.766172409057617, -16.432161331176758, -45.083587646484375, 3.839843511581421, 133.85647583007812, 119.4168472290039, -0.717315137386322, -20.354429244995117, -46.77958297729492, 46.70835876464844, -121.00655364990234, -7.714614391326904, -49.09074020385742, -0.33314478397369385, -23.45708465576172, -70.70803833007812, -28.60447883605957, 146.1763153076172, -61.69521713256836, 33.783409118652344, -8.393195152282715, -54.229312896728516, 35.87360763549805, -15.129674911499023, 14.839582443237305, -95.42417907714844, -92.32735443115234, -24.840633392333984, -66.70491790771484, 27.943151473999023, 13.072808265686035, 107.1348648071289, -0.721197783946991, 124.7112808227539, 57.04808044433594, -78.05878448486328, -6.431966304779053 ], "y": [ -126.9201431274414, -156.75404357910156, -79.89331817626953, 144.38970947265625, -85.13299560546875, -158.81649780273438, -105.92500305175781, 21.67371940612793, -54.23844528198242, -88.68746185302734, -124.76695251464844, -148.7276611328125, 84.49352264404297, -59.72150421142578, -131.11471557617188, -128.93605041503906, -126.6605224609375, -49.89215850830078, -48.41311264038086, -154.22496032714844, -157.38629150390625, -86.60478973388672, -167.145263671875, -124.84716033935547, -90.49507904052734, 38.930938720703125, -98.65646362304688, -74.273193359375, -54.480194091796875, -65.10554504394531, -100.59464263916016, -76.20425415039062, -88.88796997070312, -80.30970764160156, -76.20366668701172, -70.443115234375, -111.35395050048828, -130.28440856933594, -63.591773986816406, -23.377288818359375, -114.7765121459961, 70.27677154541016, 
-73.69287109375, -70.50360870361328, -107.39778900146484 ], "z": [ -53.52519226074219, -26.66226577758789, 104.28823852539062, 101.33555603027344, 72.46026611328125, 11.565646171569824, 105.19086456298828, -1.5903586149215698, 87.3612289428711, -116.48747253417969, 41.51200866699219, 47.47815704345703, 38.59931564331055, 38.0098876953125, 1.9415256977081299, 86.91291809082031, -9.291139602661133, 58.44478988647461, 78.07772064208984, -24.594953536987305, 65.52398681640625, 23.265583038330078, 18.08367347717285, 104.923583984375, 83.19931030273438, 39.76939392089844, 70.93531036376953, 122.31250762939453, 77.23844909667969, 124.7575454711914, 45.915184020996094, 147.10231018066406, 75.09368896484375, 101.19279479980469, 64.2965087890625, 49.403751373291016, -106.01885986328125, 26.022544860839844, 47.3941535949707, 22.0814266204834, -82.36180114746094, 91.43154907226562, 31.820758819580078, -111.32955932617188, 52.63199234008789 ] }, { "customdata": [ [ "Vietnam" ], [ "Morocco" ], [ "Nepal" ], [ "Myanmar" ], [ "Venezuela, RB" ], [ "Mongolia" ], [ "Uzbekistan" ], [ "United Arab Emirates" ], [ "Nigeria" ], [ "Sudan" ], [ "St. 
Kitts and Nevis" ], [ "Sri Lanka" ], [ "Syrian Arab Republic" ], [ "Tajikistan" ], [ "Tanzania" ], [ "Togo" ], [ "Singapore" ], [ "Sierra Leone" ], [ "Mexico" ], [ "Niger" ], [ "Senegal" ], [ "Trinidad and Tobago" ], [ "Rwanda" ], [ "Turkmenistan" ], [ "Uganda" ], [ "Qatar" ], [ "Philippines" ], [ "Peru" ], [ "Paraguay" ], [ "Pakistan" ], [ "Oman" ], [ "Saudi Arabia" ], [ "Mauritius" ], [ "Arab World" ], [ "Chad" ], [ "Upper middle income" ], [ "Albania" ], [ "Angola" ], [ "Armenia" ], [ "Azerbaijan" ], [ "Bahamas, The" ], [ "Bahrain" ], [ "Bangladesh" ], [ "Belize" ], [ "Benin" ], [ "Brunei Darussalam" ], [ "Burkina Faso" ], [ "Burundi" ], [ "Cambodia" ], [ "Cameroon" ], [ "Sub-Saharan Africa (IDA & IBRD countries)" ], [ "Sub-Saharan Africa (excluding high income)" ], [ "Sub-Saharan Africa" ], [ "South Asia (IDA & IBRD)" ], [ "Caribbean small states" ], [ "Early-demographic dividend" ], [ "East Asia & Pacific (excluding high income)" ], [ "East Asia & Pacific (IDA & IBRD countries)" ], [ "Heavily indebted poor countries (HIPC)" ], [ "Late-demographic dividend" ], [ "Least developed countries: UN classification" ], [ "Central African Republic" ], [ "Low & middle income" ], [ "Lower middle income" ], [ "Middle East & North Africa" ], [ "Middle East & North Africa (excluding high income)" ], [ "Middle East & North Africa (IDA & IBRD countries)" ], [ "Middle income" ], [ "Pre-demographic dividend" ], [ "South Asia" ], [ "Low income" ], [ "Mauritania" ], [ "Zambia" ], [ "Comoros" ], [ "Yemen, Rep." ], [ "India" ], [ "Indonesia" ], [ "Iran, Islamic Rep." ], [ "Jamaica" ], [ "Kazakhstan" ], [ "Kenya" ], [ "Korea, Rep." ], [ "Kuwait" ], [ "Kyrgyz Republic" ], [ "Lao PDR" ], [ "Libya" ], [ "Madagascar" ], [ "Malaysia" ], [ "Mali" ], [ "China" ], [ "Guinea-Bissau" ], [ "Haiti" ], [ "Guatemala" ], [ "Congo, Dem. Rep." ], [ "Congo, Rep." ], [ "Cote d'Ivoire" ], [ "Cyprus" ], [ "Dominican Republic" ], [ "Ecuador" ], [ "Egypt, Arab Rep." 
], [ "Equatorial Guinea" ], [ "Eritrea" ], [ "Ethiopia" ], [ "Fiji" ], [ "Gabon" ], [ "Gambia, The" ], [ "Georgia" ], [ "Ghana" ], [ "Guinea" ] ], "hovertemplate": "Cluster=Cluster 2
0=%{x}
1=%{y}
2=%{z}
Feature=%{customdata[0]}", "legendgroup": "Cluster 2", "marker": { "color": "#00cc96", "opacity": 0.7, "symbol": "circle" }, "mode": "markers", "name": "Cluster 2", "scene": "scene", "showlegend": true, "type": "scatter3d", "x": [ 35.51774215698242, 49.959922790527344, 97.00627136230469, -8.974799156188965, 1.756780743598938, 110.67847442626953, 38.3427848815918, 97.50794982910156, 21.036909103393555, 77.29632568359375, -7.557363510131836, 22.124521255493164, 98.8487777709961, 89.51163482666016, 63.263587951660156, 104.09825897216797, 57.12544631958008, -44.59601593017578, -48.0516471862793, 60.092220306396484, -80.48674774169922, -42.8533935546875, -16.86318016052246, 80.9300308227539, 48.83266830444336, -28.058794021606445, 87.8804702758789, 20.00042724609375, -82.54764556884766, 12.751977920532227, 62.68305969238281, 10.184957504272461, 49.835636138916016, 39.43074417114258, 60.842079162597656, -46.23152542114258, 12.279155731201172, 143.78453063964844, 50.9847526550293, 21.534423828125, -19.452762603759766, 66.55541229248047, 92.21378326416016, -26.787494659423828, 78.06719207763672, 136.4708251953125, 47.55731964111328, -1.3944733142852783, 43.80042266845703, 77.67610931396484, 42.80725860595703, 68.00390625, 46.35131072998047, 16.59248161315918, 4.2512593269348145, 91.16024780273438, 61.532997131347656, 27.364946365356445, 55.3148307800293, 10.863265991210938, -159.91925048828125, 53.54957962036133, 34.45584487915039, 39.28474807739258, 29.621797561645508, -27.884536743164062, 56.14976501464844, 2.3209922313690186, 96.68293762207031, 54.63113021850586, 30.952590942382812, 2.4865574836730957, -38.24899673461914, 88.69066619873047, 29.865819931030273, 54.2628288269043, -18.805095672607422, 42.29069900512695, 44.05807876586914, 63.83021926879883, 70.3000717163086, -10.175737380981445, 15.66401195526123, -21.97629737854004, 95.2664566040039, 35.04226303100586, 87.1489486694336, -151.65048217773438, -1.678355097770691, 35.30405044555664, 78.0763931274414, 
66.00018310546875, 89.95539093017578, 126.9373550415039, 77.37574005126953, 119.95099639892578, -30.056663513183594, 70.9675521850586, 50.80670928955078, 37.00065612792969, 103.53599548339844, 43.948814392089844, 16.377910614013672, 130.62411499023438, 48.151432037353516, 1.428124189376831, 87.9597396850586, -37.089603424072266, 84.31513214111328 ], "y": [ 86.11861419677734, 151.85350036621094, 42.53098678588867, 153.9085235595703, 72.39804077148438, -37.44678497314453, -28.3231201171875, 46.3528938293457, 116.9840316772461, 160.2217254638672, 26.292734146118164, 66.28407287597656, -24.869197845458984, 9.763477325439453, 9.357078552246094, 50.154151916503906, 106.84445190429688, 64.37794494628906, 115.95806121826172, 45.53333282470703, 1.5635287761688232, 114.46210479736328, 83.75853729248047, 50.861351013183594, 41.69894790649414, 70.961669921875, 92.66638946533203, -30.671457290649414, 83.8593521118164, 127.13004302978516, -32.8255615234375, -0.004149935208261013, 48.83694839477539, 3.0405452251434326, 67.02842712402344, 71.17982482910156, 24.160755157470703, -2.866029977798462, 6.350869178771973, -45.496646881103516, 57.02355194091797, -68.80757141113281, 114.5761947631836, 68.81050109863281, 18.279218673706055, -11.911029815673828, -1.9755653142929077, 81.80469512939453, 158.60107421875, 85.61334991455078, -102.58647155761719, -98.5969009399414, -125.60010528564453, 126.72012329101562, -43.857913970947266, 6.927072525024414, 42.797386169433594, -150.87738037109375, -6.679513454437256, -9.826323509216309, -20.47049331665039, 49.222068786621094, -76.31359100341797, 97.8327865600586, -57.29827880859375, 134.44325256347656, -44.07075881958008, 83.14803314208984, -71.80452728271484, 89.81132507324219, 53.70758819580078, 82.70372009277344, 26.26255226135254, 13.54741096496582, 59.91390609741211, 125.4966049194336, 122.30960845947266, 17.092138290405273, -59.853797912597656, -7.135588645935059, 61.16280746459961, 96.15939331054688, 1.4561012983322144, 
35.749420166015625, 108.18864440917969, 43.08784866333008, -13.24064826965332, -57.43830490112305, 32.07301712036133, 59.270713806152344, 138.17596435546875, 113.50666046142578, -15.672411918640137, 80.99279022216797, 95.73780059814453, -48.45591735839844, 95.77444458007812, 75.1473617553711, 95.57159423828125, 27.90198516845703, 32.78878402709961, 100.00543975830078, 22.384517669677734, 5.624805927276611, 126.52156066894531, 116.10196685791016, 138.16004943847656, 103.63263702392578, 116.77137756347656 ], "z": [ 66.11446380615234, -7.878054141998291, 35.765384674072266, -32.94074630737305, -58.590911865234375, 85.04874420166016, -118.80330657958984, -38.865291595458984, -14.068526268005371, 15.291756629943848, -132.68995666503906, -91.11685943603516, -118.00121307373047, 111.69256591796875, 23.590957641601562, -0.6745773553848267, -3.916962146759033, -137.80848693847656, 61.876129150390625, 8.923430442810059, -133.58795166015625, 0.3559304475784302, -19.630861282348633, -146.30206298828125, -39.74351119995117, -93.055419921875, -17.991783142089844, -49.04780578613281, 82.7301025390625, -45.30446243286133, 10.661585807800293, -31.399181365966797, 122.66265869140625, -55.47542953491211, -119.45091247558594, 14.388965606689453, 4.403152942657471, -75.97978210449219, 141.58326721191406, -160.31509399414062, 38.06013107299805, -67.57469177246094, -49.09112548828125, 74.23567962646484, -23.329309463500977, 54.53202819824219, 74.52362823486328, 111.16339111328125, -74.96077728271484, -63.403987884521484, -63.87319564819336, -39.219146728515625, -38.194828033447266, -80.41859436035156, -91.44154357910156, 59.5721549987793, 52.12397384643555, 100.87918090820312, -24.58880043029785, -87.10834503173828, -40.81977844238281, -78.04425811767578, -32.282493591308594, -64.45409393310547, -62.914947509765625, 30.32049560546875, -31.711257934570312, 18.049297332763672, -106.74824523925781, -34.496070861816406, -10.772473335266113, -125.51321411132812, -85.4994888305664, 
-118.17176055908203, -130.54376220703125, -42.73122024536133, -62.93001937866211, -8.273773193359375, -98.51644134521484, -93.38803100585938, 85.25978088378906, 73.7366714477539, -151.66749572753906, 71.36871337890625, -92.11683654785156, 85.09620666503906, -58.887489318847656, -52.473731994628906, -54.95683670043945, 43.04727554321289, -78.57160949707031, -122.99945068359375, -20.77290916442871, -53.3505973815918, 78.65189361572266, -72.87665557861328, 42.01951217651367, 38.67578887939453, 97.65454864501953, -100.09162139892578, -72.15169525146484, -98.67756652832031, 45.46915054321289, -27.213851928710938, 30.882976531982422, 98.3547592163086, -16.266990661621094, 116.29129028320312, 24.138912200927734 ] }, { "customdata": [ [ "Nauru" ], [ "Tuvalu" ], [ "Marshall Islands" ] ], "hovertemplate": "Cluster=Cluster 3
0=%{x}
1=%{y}
2=%{z}
Feature=%{customdata[0]}", "legendgroup": "Cluster 3", "marker": { "color": "#ab63fa", "opacity": 0.7, "symbol": "circle" }, "mode": "markers", "name": "Cluster 3", "scene": "scene", "showlegend": true, "type": "scatter3d", "x": [ -96.54039001464844, 89.89451599121094, -126.18791198730469 ], "y": [ -134.3475341796875, -74.43345642089844, -121.75009155273438 ], "z": [ -3.933764934539795, 119.6111068725586, -26.51927947998047 ] } ], "layout": { "height": 800, "legend": { "title": { "text": "Cluster" }, "tracegroupgap": 0 }, "scene": { "domain": { "x": [ 0, 1 ], "y": [ 0, 1 ] }, "xaxis": { "title": { "text": "0" } }, "yaxis": { "title": { "text": "1" } }, "zaxis": { "title": { "text": "2" } } }, "template": { "data": { "bar": [ { "error_x": { "color": "#2a3f5f" }, "error_y": { "color": "#2a3f5f" }, "marker": { "line": { "color": "#E5ECF6", "width": 0.5 } }, "type": "bar" } ], "barpolar": [ { "marker": { "line": { "color": "#E5ECF6", "width": 0.5 } }, "type": "barpolar" } ], "carpet": [ { "aaxis": { "endlinecolor": "#2a3f5f", "gridcolor": "white", "linecolor": "white", "minorgridcolor": "white", "startlinecolor": "#2a3f5f" }, "baxis": { "endlinecolor": "#2a3f5f", "gridcolor": "white", "linecolor": "white", "minorgridcolor": "white", "startlinecolor": "#2a3f5f" }, "type": "carpet" } ], "choropleth": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "choropleth" } ], "contour": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "contour" } ], "contourcarpet": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "contourcarpet" } ], "heatmap": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, 
"#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "heatmap" } ], "heatmapgl": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "heatmapgl" } ], "histogram": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "histogram" } ], "histogram2d": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "histogram2d" } ], "histogram2dcontour": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "histogram2dcontour" } ], "mesh3d": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "mesh3d" } ], "parcoords": [ { "line": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "parcoords" } ], "pie": [ { "automargin": true, "type": "pie" } ], "scatter": [ { "marker": { 
"colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatter" } ], "scatter3d": [ { "line": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatter3d" } ], "scattercarpet": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattercarpet" } ], "scattergeo": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattergeo" } ], "scattergl": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattergl" } ], "scattermapbox": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattermapbox" } ], "scatterpolar": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterpolar" } ], "scatterpolargl": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterpolargl" } ], "scatterternary": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterternary" } ], "surface": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "surface" } ], "table": [ { "cells": { "fill": { "color": "#EBF0F8" }, "line": { "color": "white" } }, "header": { "fill": { "color": "#C8D4E3" }, "line": { "color": "white" } }, "type": "table" } ] }, "layout": { "annotationdefaults": { "arrowcolor": "#2a3f5f", "arrowhead": 0, "arrowwidth": 1 }, "coloraxis": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "colorscale": { "diverging": [ [ 0, "#8e0152" ], [ 0.1, "#c51b7d" ], [ 0.2, "#de77ae" ], [ 0.3, "#f1b6da" ], [ 0.4, "#fde0ef" ], [ 0.5, "#f7f7f7" ], [ 0.6, "#e6f5d0" ], [ 0.7, "#b8e186" ], [ 0.8, "#7fbc41" ], [ 0.9, 
"#4d9221" ], [ 1, "#276419" ] ], "sequential": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "sequentialminus": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ] }, "colorway": [ "#636efa", "#EF553B", "#00cc96", "#ab63fa", "#FFA15A", "#19d3f3", "#FF6692", "#B6E880", "#FF97FF", "#FECB52" ], "font": { "color": "#2a3f5f" }, "geo": { "bgcolor": "white", "lakecolor": "white", "landcolor": "#E5ECF6", "showlakes": true, "showland": true, "subunitcolor": "white" }, "hoverlabel": { "align": "left" }, "hovermode": "closest", "mapbox": { "style": "light" }, "paper_bgcolor": "white", "plot_bgcolor": "#E5ECF6", "polar": { "angularaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" }, "bgcolor": "#E5ECF6", "radialaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" } }, "scene": { "xaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" }, "yaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" }, "zaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" } }, "shapedefaults": { "line": { "color": "#2a3f5f" } }, "ternary": { "aaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" }, "baxis": { 
"gridcolor": "white", "linecolor": "white", "ticks": "" }, "bgcolor": "#E5ECF6", "caxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" } }, "title": { "x": 0.05 }, "xaxis": { "automargin": true, "gridcolor": "white", "linecolor": "white", "ticks": "", "title": { "standoff": 15 }, "zerolinecolor": "white", "zerolinewidth": 2 }, "yaxis": { "automargin": true, "gridcolor": "white", "linecolor": "white", "ticks": "", "title": { "standoff": 15 }, "zerolinecolor": "white", "zerolinewidth": 2 } } }, "title": { "text": "3d TSNE Plot for Clusters" }, "width": 900 } }, "text/html": [ "
\n", " \n", " \n", "
\n", " \n", "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "plot_model(kmeans, plot = 'tsne')" ] }, { "cell_type": "code", "execution_count": 11, "metadata": {}, "outputs": [ { "data": { "text/html": [ " \n", " " ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAf0AAAFlCAYAAADh+TGmAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4yLjEsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy+j8jraAAAgAElEQVR4nOzdd1QU1/vH8fdSRYqIwYaKFbBERLCDXdEkKHYlISaW2DDRJPYWUWNMFHuPJgYENbZo1NhilxBFxQb2rlFUlKL0/f3Bl/2FKIIKO8vyvM7xHHZ2duZzd8Fn752ZOyq1Wq1GCCGEEHrPQOkAQgghhNAOKfpCCCFEISFFXwghhCgkpOgLIYQQhYQUfSGEEKKQkKIvhBBCFBJS9IUibt++TfXq1enYsSMdO3bEy8uLnj17sn37ds06c+fOZfPmza/czoIFC9izZ89r7//fr8vNfl7H/v376dGjBx06dOD999/niy++4J9//smz7efWxo0bcXV11bzHmf9GjhwJwOjRo1mxYgUAjo6OPH78OF/zREZG0rp1azp37szt27ffaBthYWF88MEHWZb99NNPNG3alKioKMLCwnB0dGTUqFEvvNbX1xcXF5c32m9e2rdvH76+vnTs2JH333+fYcOGce/ePSDjMxswYMAbb/tN/x769+/P5cuX33i/ouAwUjqAKLyKFCnCb7/9pnl8584dPvnkEwwNDfH09OSLL77IcRthYWFUrVr1tff979flZj+5df/+fUaNGsXGjRuxs7MDYPHixQwbNow1a9bk2X5yy83NjaVLl2p9vy+zd+9eGjRowLRp0/Jsm7Nnz2bXrl2EhIRgZ2dHWFgYtra27Nu3j+fPn2NmZgZk/G5du3Ytz/b7prZu3crixYtZvHgx9vb2qNVqli1bxscff8y2bdveevtv+vewfPnyt963KBik6AudYWdnx+eff86KFSvw9PRk9OjRVKtWjb59+zJv3jx2796NsbExxYsXZ/r06ezevZuzZ8/y/fffY2hoSMOGDZk8eTJRUVGoVCo8PDz48ssvMTIyolatWrRq1YqoqCi8vLyyvG7v3r2a/Rw/fpzvv/+e58+fY2xszLBhw2jatCkbN25k9+7dGBgYcOPGDYoUKcKMGTOoUqVKljbExMSQkpLCs2fPNMt69+6Nk5OT5vHSpUvZtGkTRkZG2Nvb891332FpacnChQvZtm0bhoaGVKpUiQkTJmBra4uvry/FihXj6tWr9OrVC29vb6ZNm8bFixdJSUmhUaNGjBw5EiOjt/tznjNnDmfOnCE9PZ1hw4bRokULgJfmioiIYOXKlQQHBwPg6enJ+++/z+eff84///xD165dOXjwIAYGGYOJW7ZsISQkhLS0NBITE5k1a1au2+vr6/tC1vT0dPz9/YmKiiI4OJjixYtrnrO2tqZ8+fLs2bMHLy8vADZv3oyXl1eWL16//vorISEhpKenY21tzYQJE6hSpQrXrl3D39+fhIQEoqOjcXJyYs6cOZiamvLuu+/y2WefceTIER48eEC/fv3w8fEhOjqaUaNGERMTA0CzZs0YNmzYC7lnz57NlClTsLe3B0ClUvHZZ59RpkwZkpOTs6zr6+vLhx9+SLt27V54nJu/h2bNmjFz5kyOHTtGWloaNWrUYPz48VhYWNCyZUtq167NhQsX+PLL
L5k+fTpz587l2bNnzJ49m/Lly3Pp0iVSU1OZPHkyrq6uPH78mDFjxnDz5k2sra2xtbWlWrVqDB069M1+4YQiZHhf6BQnJycuXryYZdm9e/dYtWoVGzZsYOPGjTRp0oTTp0/z4YcfUqtWLUaOHEmbNm2YOnUq1tbWbN26lQ0bNnDhwgVWrlwJQEpKCi1atGDnzp34+flleV2mmJgYPv/8c8aNG8fWrVuZMWMGI0aM4NatWwAcO3aMCRMm8Pvvv+Ps7MyyZctemr979+506tSJ9957j/Hjx7Nv3z48PDyAjN7uxo0bWbt2Lb///jvlypUjKCiIDRs2cOjQIdavX8/WrVupVq0ao0eP1mzXysqK7du34+vry7fffkvNmjXZuHEjmzdvJiYmhp9++uml7+fx48dfGN7fsGHDS9ctV64cmzZt4ocffmD06NE8fvw421zu7u5cuHCB2NhYbt++TUJCAkePHtW0sXXr1pqCD9ChQwd69uzJe++9x6xZs16rvf+VmprKiBEjCAkJYdCgQVkKfiZvb+8so0g7duzIcljg77//ZvPmzaxevZrNmzfTr18//Pz8AFi3bh3e3t6sW7eOXbt2cfv2bfbv3w9AcnIyxYsXZ82aNcybN4/p06eTlJTEunXrNO/f6tWruXHjBnFxcVkyxcTEcOfOHerWrZtluUqlokOHDlhYWLz0c/mv3P49LFu2DENDQzZu3MiWLVsoWbIkM2fO1GynWrVq7NixI8vfAMDp06fp06cPmzdvpnPnzsyePRuAqVOnUrVqVXbs2MHcuXM5ceJErvIK3SI9faFTVCoVRYoUybKsVKlSODk50alTJ5o2bUrTpk1p1KjRC689ePAgISEhqFQqTExM6NmzJ6tWreKzzz4DMoa6X+X06dNUqFABZ2dnIOM/xbp16/L333+jUqmoWbMmpUuXBqBGjRrs3r37pdsZPXo0AwYM4O+//+bYsWN8//33BAYGsnr1akJDQ2nXrh3FihUDYMyYMUDGIYbOnTtTtGhRAD7++GOWLFmi6f39O/v+/fs5c+YM69evByAxMTHbNr3O8H6vXr0AcHBwoEqVKpw8eZKDBw++NJeBgQGNGzfmyJEjxMTE0KNHD9auXUtcXBx//vkn/fr1e+W+stvuy9r7X9euXcPFxYUZM2YwevRoNm7cSJkyZbKs06JFC7755hsePnzIjRs3qFy5suY9h4z38MaNG/Ts2VOzLDY2lidPnjBixAiOHDnC8uXLuX79Og8ePMgyctOqVSsAatasSXJyMs+ePcPDw4PPPvuMe/fu0bhxY7766issLS2zZMr8EpSenv7K9yYnuf172L9/P3FxcZovYykpKZQoUULzfHbvcdmyZalevTqQ8Xu+adMmAA4cOKD5uWTJkpoRCFGwSNEXOuXMmTM4ODhkWWZgYEBQUBBnzpwhNDSUb7/9Fg8PD80JaZnS09NRqVRZHqempmoeZxaY7KSlpWV5PYBarSY1NRVjY+MsX0ZUKhUvu23F3r17efLkCV26dMHT0xNPT0+GDx9Os2bNOH/+PIaGhln2ERsbS2xs7GtlT09PZ+7cuZpDC7GxsS/kfhP/7pmnp6djZGT0ylytW7fm4MGDxMbG0q9fP65evcqePXu4ePEi9evXf+W+3uazqlixItOnTwfgxIkTDB06lODgYExMTDTrmJiY0LZtW7Zt28bly5fp1KnTC/vv2LEjI0aM0Dx+8OABxYoVY/jw4aSlpdG+fXuaN2/OvXv3snzWpqamAJr8arWa2rVrs3fvXkJDQ/nrr7/o1q0by5cvp1atWprXFStWjIoVKxIREUHjxo2z5Pniiy8YNGjQC239935TUlKA1/t7GDt2LM2aNQMgISGBpKSkHN/j7H7PjYyMsuT59++LKDjkUxM649q1ayxatIg+ffpkWR4VFcUHH3xAlSpVGDBgAJ988glnzpwBwNDQUFMs3N3dCQoKQq1Wk5yczLp16174zzXTv1+XqU6dOly9epXT
p08DcOnSJY4dO5ZjAfs3c3NzAgICspwJfevWLQwNDalQoQKNGzdm9+7dxMfHAzB//nx+/vlnPDw82LBhg6ZHGRgYSL169bIUskzu7u78/PPPmnYOGjSIoKCgXGfMTmYv7ty5c9y8eRNnZ+dX5mrZsiWhoaFERkZSu3ZtmjRpwty5c2natCmGhoav3NfrtPe/jI2NNT+PGzeOtLQ0Jk+e/MJ63t7ebNq0iWPHjmkOr2Ryd3dn27ZtPHjwAICQkBB69+4NwOHDhxkyZAjvvfceABEREaSlpb0y08yZM1m0aBGtW7dm3LhxVK1alUuXLr2wnp+fH9OmTePGjRtAxhfNRYsWERUVReXKlbOsa2Njw9mzZwG4fPkyFy5cAF7v72H16tUkJyeTnp7OhAkTCAgIeGU7XqVZs2aa0aWYmBj27NmTJ182hXZJT18oJjExkY4dOwIZvQZTU1O+/PJLmjdvnmU9Jycn2rdvT5cuXShatChFihRh/PjxALRs2ZKAgABSUlIYP348U6dOxcvLi5SUFDw8PBg4cOBL9/3v12WysbFh7ty5TJkyhcTERFQqFdOnT6dSpUqcPHkyV21q2LAhEyZMYNSoUcTFxWFoaIitrS3Lly+nWLFiNGvWjMuXL2uG0qtWrcqUKVMoWrQo9+7do1u3bqSnp2Nvb5/l+Ou/jRs3jmnTpmna2bhx42yH0zOP6f9b5nHe/7p16xbe3t6oVCoCAgKwtrama9eu2eaytLSkSpUqmJmZYWhoiIeHB+PGjaNt27Y5vk+v2u7rMDU1Ze7cuXTq1InatWtTsWJFzXMuLi48f/6cli1bvnCSo7u7O/3796dPnz6oVCosLCxYsGABKpWK4cOHM2TIEIoWLYqFhQX16tXj5s2br8zRu3dvRo8ezQcffICJiQmOjo68//77L6zn5eWFWq3myy+/JDU1laSkJGrWrMmqVate+MIzaNAgRo8ezYEDB6hcubJmOD63fw+DBw9mxowZdOrUibS0NKpXr57lvInXNWbMGMaPH4+XlxfW1taULVv2hUNxQvep5Na6QgghcrJ69Wpq1KiBi4sLycnJ+Pj4MHToUM3hA1EwSE9fCCFEjjJHpdLT00lJSaFdu3ZS8Asg6ekLIYQQhYScyCeEEEIUElL0hRBCiEJCr4/pp6enk5CQgLGxsVxaIoQQolBQq9WkpKRgbm7+wnwKel30ExISXpjSVQghhCgMHBwcXpgZUq+LfuYkHg4ODrma9CO3zp49m2WmrYJKX9rRvn17UlJS3uiWorpIXz4X0J+26Es7QNqii/K6HcnJyVy8eDHLRFaZ9LroZw7pm5iYaKbOzCt5vT2l6EM7FixYwPnz5/WiLZmkLbpHX9oB0hZdlB/teNlhbb0u+qJwqFGjBs+fP1c6hhBC6Dw5e18IIYQoJKSnLwo8Z2dnkpOTiYyMVDqKEELoNOnpCyGEEIWEFH0hhBCikJCi/5om74xg2ekHSscQQgghXpsc038Nk3dG4L/rNABld0YwydNZ4URCCCFE7klPP5f+XfAB/HedZvLOCAUTCSGEEK9Hevq58N+CnylzmfT4lTV06FBu3rypdAwhhNB5UvRzkF3BzySFX3n9+vUjPDxc6RhCCKHzZHhfCKH3mjVrppnHoVmzZpw7d07hRFk1a9aM8+fPKx1DFAJS9HMwydOZiW1rZ/v8xLa1pZevsIEDB/Ldd98pHUPoqKdPn/Lw4UOqVKlCbGwsDx48oHLlyorl8fDwyDKR1NOnT4mOjqZKlSr5sr/r16/z7rvv8vXXX+fL9nVRdm3etm0b7du3p06dOrRu3Zrjx48DGTeoGTt2LC1atMDFxQVvb28OHDiQ5bUuLi5Z/lWvXp0pU6ZkWSc327l9+zb9+/enXr16NGnSBH9/f9LS0jTPBwUF0blzZ2rVqsXo0aPz8m0BZHg/VzKL+n+H+aXg64bQ0FCSk5OVjiF01MWLF6lYsSImJiacPn2aMmXKYGZmpkiWx48f8/jx
4ywF/uLFi1SoUCHfbhzj7+/Pu+++my/bfhNpaWkYGhrm6z5e1uYjR44wc+ZMZs+eTe3atYmOjtY8l5qaSpkyZQgMDKRs2bIcOHCAYcOGsXXrVsqVKwfAyZMnNes/e/aMJk2a0K5duyz7yM12Jk+eTIkSJTh8+DCxsbH06dMHQ0ND6tevD0DJkiUZPHgwhw4dIikpKc/fG+np59J/e/zFihgzvo3u/CEJUditW7eO9957D1dXV/r168ejR48AuHDhAg4ODpqfK1WqxPTp06lXrx5t27bV9PYA1Go1y5Yto0WLFri5ufHFF18QFxcHZPT07t27B0BISAiOjo48fPgQgB9//JFx48YB8OjRIwYOHEjjxo2pW7cuAwcOJD4+nhs3btC8eXPS09Np0KABDRo0IDU1NUu+58+f89VXX+Hn50dCQsJbvyfbtm3D0tKSRo0a5fo1t27dYsCAATRo0ABXV1c+/fRTzXO///47nTt3xtXVldatWxMWFvbK9wzg119/pU+fPowdO5Z69erx008/Adl/XvnV5vnz5zN48GDq1KmDgYEBpUqVolSpUgAULVqUoUOHUq5cOQwMDGjRogXlypXL9jDQzp07sbGxwc3NLcvy3Gzn9u3btG/fHlNTU2xtbXF3d+f27dua59u2bUvr1q2xtrbOk/fjv6Tov4bMwu9U3JSniSn8fv6O0pGEUIyzs/NL//3444+adb777ruXrtO3b1/NOqtWrXrpOq9jyZIlrFmzhsWLFxMaGkqpUqWYM2cOkFHoHR0dNT+fPn2aevXqcfToUTp06MCECRM025kzZw6HDh1i7dq1HDlyhOTkZBYuXAiAlZUVCQkJqNVqgoODsbe35+nTp6jVatauXYuvry8A8fHx+Pr6sn//fv78809iYmJYs2YN9vb2jBo1Ck9PT06ePElYWBhGRkaaon/r1i18fHyoVKkS8+fPx9zcXJNrwIABuLm5vfTfgAEDXvqexMfHM2/evNceIh45ciRNmzbl6NGjHD16FD8/PwBWrlzJ4sWLmTJlCseOHWPhwoXY2dm98j3LfM9PnjxJq1atCAsL4+OPP37l55UfbU5LS+Ps2bPExMTQpk0bmjZtir+/P4mJiS/dzsOHD7l+/TpVq1Z96fObNm3C29v7pbeuzWk7H3/8Mdu2beP58+fcv3+fQ4cOvfbv+9uQ4f3XNMnTGSejeHy2X2Xh4Sg61iqvdCQhCrVHjx6xePFiNm/ejL29PQBdu3Zl8uTJQMbwecuWLTU/9+7dm9atWwPQrVs3FixYQGpqKk+ePCEoKIjt27dTsmRJADw9PVm/fj1t2rTBysqKZ8+ecfjwYSpUqABAXFwcBw8epFSpUjg5OQFgb2+vyWFiYkLjxo2JjY0FICoqiurVq2fJf/HiRVQqFb1792bs2LGabP+2dOnS135f5syZQ5cuXShTpsxrve7WrVukpaWRlpaGqakprq6uPH78mAULFhAcHKxpZ+ZIR3bvWaaoqCj69u1Lq1atgIz37FWfV360+eHDh6SkpPDHH3+wevVqjIyMGDx4MIsXL2b48OFZ1k1JSeHrr7+mU6dOLz3P4u7duxw7doxp06a9Mkt226lfvz6//vorrq6upKWl0alTpxdGDPKTFP03UNW6CM2rlGLvpX+IvP+U6qWKKR1JCK2LiMh5cqrRo0fj6ur6ynV69+5N79693zhHaGgoKSkpdOvWTbNMrVZTo0YN1Go1Fy9e1AyfX7p0ialTp2rWi4mJwdLSEiMjI44fP46Dg4NmyBfgyZMn2NraAv/f01+1ahX9+/dn48aNPH36lJCQEE0vH2DHjh2sWrWKGzdukJKSQmJiIv7+/gBERkZmKeqZ+W7dusUnn3zy0oL/JiIjIwkNDWXTpk2v/doffviBJUuWsHDhQlq1asXIkSM5evQoDg4OmoKfKaf3DDJ6+t98843m8as+r7fxqjYXKVIEAF9fX82Xk08//fSFop+ens7IkSMxNjbOMgL0b5s3
b8bV1ZXy5bPv8GW3nfT0dPr27UuPHj1Ys2YNCQkJjB07lpCQEK0Vfin6b2iIuxP7r9xn4eEoFnRpoHScQs3NzY2YmBilYwiFPH36lNatWzNv3rwXnrt16xYGBgbY2dlx584d4uPjsbGx0Ty/a9cumjdvDmScZGdpaZnl9Xv37sXT0xMAS0tLzp49S3R0NA0aNGDXrl1cuHCBixcvaop1aGio5mSxzCLWsmVLqlevTnp6OpcuXcpSODOP5f7000988sknNGrU6KUn3b1qLgpXV9csh1QAwsLCuHPnDi1atAAyTjzL7FWOHz8++zcTaNSoEY0aNeLRo0f079+fTZs2YWJigpWV1Qvr5vSe3blzh9TU1CxXS7zq88qvNm/atInSpUu/cjherVYzbtw4Hj58yPLlyzE2Nn7per/99hv9+/d/o+08efKEe/fu8dFHH2FiYoKJiQldunRh+vTp2W4vr0nRf0MdapajvHVRfjl+lWnvuVDMzETpSIXWihUrZHKeQqxGjRrMmzePc+fOUbNmTeLj4/nrr79o1apVlpPkLl68iJGREVu3bsXX11dzHHr16tUAvPvuu8yZM4ebN29SokQJfvzxRx4+fEiXLl04f/48xYoVY9WqVQwbNgwACwsLfvnlFz7++GPN2egXLlygTJkyVK5cmdjYWL777jvN2fqJiYkkJiaiVqs12TPPN3B0dGTKlCn4+fnx66+/anqjmf5b4HLSo0cP3n//fc3jlStXcufOHb755huuXbumOeb930tdd+3ahYODA/b29iQkJBAbG4uTkxOmpqYEBAQQFRWFo6MjN27cIC0t7ZXvGWQM7Ts4OGBg8P+nj73q8/p3Uc7LNgN07tyZwMBAPDw8MDIyYtWqVZovfACTJk3iypUr/PTTT5qRgf86ceIE9+/ff+Gs/X971XZsbGwoV64cISEh9OnTh2fPnrFp0ybN4SLIuAIgLS2N9PR00tLSSEpKwtDQECOjvCnXUvTfkJGhAQMbOzBu+ylWHbvC502r5/wiIUSec3FxYciQIQwdOlQzXN+iRQtat26d5SS+ixcv0rFjR06cOMG8efOoVKkSixYtomLFikBG0R84cCA+Pj4kJibSuHFjVq1apbm8z8rKitTUVLy8vAAwNzcnNjY2yzC1l5cXf/zxB+7u7lSrVo3mzZtTpUoVTa+uZ8+evPfee1hYWHDw4MEs+TLzDhkyhKCgoLe6hM/MzCzLZYlFixbFxMQEGxsbrl27xr1797IUyEzh4eH4+/uTkJBAyZIl+eyzzzRnwQ8aNIgBAwYQGxuLnZ0dM2bMyPE9i4qKeuGQwKs+r7fxqjYDDB48mJiYGDw9PTE1NaV9+/YMGjQIyBiRWLt2LSYmJri7u2u2MXnyZDp06KB5vHnzZtq0aYOFhUWWfffr1w83Nze8vLxy3M6CBQv49ttvWb58OQYGBjRo0CDL4aHFixezYMECzeMtW7bg5+fH0KFD3+r9yaRS//trp55JSkri7Nmz1KpVK0+vgQ0PD8fV1ZWH8YlUmLKB8tbmRI7qiIHBq8/k1DWZ7SjoVq1axc2bN7M9BlfQ6MvnAvrTFn1pB2QMg3/zzTds2bIl2yHsgkJfPpe8bserap9csvcW3rEoQk+XSlx+GMfOC3eVjlNoBQQEEBwcrHQMIQoEIyMjduzYUeALvngzUvTfkp97xtDcgsNRCicRQgghXk2K/luqW64EjSva8kfUXS5FxyodRwghhMiWFP08MOR/vf3FRy8onEQIIYTInhT9PNCltj1lrMz46e8rxCelKB1HCCGEeKl8LfoRERGaSxFu3LhBr1698PHxYdKkSaSnpwMZN13o3Lkz3bt3Z9++fQAkJiYydOhQfHx86N+/P48fPwbg1KlTdOvWjZ49e2a5pEFpxoYGDGjkQGxiCoHhV5WOI4QQQrxUvhX95cuXM378eM2tAadPn86wYcMIDg5GrVazd+9eoqOjCQwMZM2aNaxYsYKAgACSk5MJCQnB
wcGB4OBgvL29WbRoEZAx6cGsWbMICQkhIiIi2zsgKaF/w2oYGxqw6PAF9PgqSJ107NgxzZ27hBBCZC/fin6FChWYP3++5vG5c+c09wvOvIPT6dOncXFxwcTEBEtLSypUqEBUVBTh4eF4eHho1g0NDSU+Pp7k5GQqVKiASqXC3d2d0NDQ/Ir/2kpbmdG1dgXO33/Kn5f+UTpOoWJiYiKXHwkhRC7k24x8np6eWe4RrFarNVMsmpubExcXR3x8fJZ5m83NzYmPj8+y/N/r/nsWJHNzc27dupWrLGfPns2LJmXxsmlfW9tCCDB1WxjWcQXj7nv6MH3tzZs3lY6Q5/Thc8mkL23Rl3aAtEUXaasdWpuG999zLyckJGBlZYWFhQUJCQlZlltaWmZZ/qp1X3YDiJfJrxn5/quuWs3iyDgO335MiUqOVLSxeMmrdYe+zGbVp08fkpOTiYyMVDpKntCXzwX0py360g6Qtuii/JqR72W0dvZ+jRo1CAsLA+DgwYO4ublRu3ZtwsPDSUpKIi4ujitXruDg4EDdunU5cOCAZl1XV1csLCwwNjbm5s2bqNVqDh8+rNV7EOeGSqViiLsj6Wo1i4/I5XtCCCF0i9aK/qhRo5g/fz49evQgJSUFT09PbG1t8fX1xcfHh969ezN8+HBMTU3p1asXly5dolevXqxduxY/Pz8g46YFX3/9NV27dqVGjRo4OztrK36u9ahTEVsLU1aEXeZZcqrScYQQQgiNfB3eL1euHOvWrQOgUqVKBAUFvbBO9+7d6d69e5ZlZmZmL73Xcp06dTTb01WmRob0b1iNb/ecJeTkNfo2qKZ0JCGEEAKQyXnyxYBGDhgaqFgol+8JIYTQIVL080E5a3O8a5Un4m4Mh689UDqOEEIIAUjRzzd+7k4ALDgsJ/Tlt7lz5/Lll18qHUMIIXSe1i7ZK2w8KpekdpnibDpzk9tPEihnba50JL3VvHnzLPM9CCGEeDnp6eeTzMv30tLVLA29qHQcIYQQQop+fvKpW4niZiYs/+sSiSlpSsfRW61bt9Zc1imEECJ7UvTzUVETI/o2qEp0fBK/RtxQOo7eio6O5smTJ0rHEEIInSdFP58NauKIgUrFwsNRSkcRQghRyEnRz2cVbSz4oIYdx249IuxGtNJxhBBCFGJS9LVALt8TQgihC6Toa0HLaqWpXqoYv0bc4J/Y50rHEUIIUUhJ0dcClUrFkCaOpKSls/yvS0rH0Ts9e/akTZs2SscQQgidJ0VfS3zdKmNVxJiloRdJTpXL9/LSmDFj6N27t9IxhBBC50nR1xILU2M+qVeFe7HP2XjmptJxhBBCFEJS9LVocBNHABbJCX15asKECSxdulTpGEIIofNk7n0tqmZrRTunsvwRdZeTtx/jUs5G6Uh6YcuWLSQnJysdQwghdEB9yCAAACAASURBVJ709LXs/y/fk8l6hBBCaJcUfS3zdCxL1XcsCTl5jYfxiUrHEUIIUYhI0dcyAwMVg5s4kpSazoqwy0rHEUIIUYhI0VfAJ/WqYG5ixOKjF0hNS1c6jhBCiEJCir4CipmZ4OtWmVtPnrHl3G2l4xR49vb2lC5dWukYQgih86ToK2TI/y7fk7vvvb0tW7Ywc+ZMpWMIIYTOk6KvkBqlrWlVrTT7r9znzL0YpeMIIYQoBKToK2jI/y7fW3REJut5G9u3b+fo0aNKxxBCCJ0nRV9BH9Swo6KNOUHhV4l5lqR0nAJrzJgxLFq0SOkYQgih86ToK8jQwIBBjR15lpzGz8euKB1HCCGEnpOir7A+DapSxMiQRUcukJYul+8JIYTIP1L0FWZT1BSfupW4+iieHVF3lY4jhBBCj0nR1wF+HhmX7y04JJfvCSGEyD9S9HWAc1kbPCqXZPfFe1x48FTpOEIIIfSUFH0dkXn53sLDcvne69q+fTuzZ89WOoYQQug8Kfo6wrtWeeyKFWXV8SvEJsq94V+HnZ0dtra2SscQQgidJ0VfRxgbGjCw
sQPxSakEHr+qdJwC5cmTJ8TFxSkdQwghdJ4UfR3Sr0FVTAwNWHj4AunpaqXjFBjNmjVj0KBBSscQQgidJ0Vfh5S0NKOHS0UuRMey59I9peMIIYTQM1L0dYzf/07oWyB33xNCCJHHpOjrGLfyJWhQ4R22R97h6iM5Ti2EECLvSNHXQUPcHVGr5e57Qggh8pYUfR3UzdmeUpZF+OnvKyQkpSgdRwghhJ6Qoq+DTIwM+ayhA0+eJ7P6xDWl4+i8CRMm0KdPH6VjCCGEzpOir6M+a1QNIwMVCw9fQK2Wy/depWvXrrRs2VLpGEIIofOk6OuossWK0qW2PWf/ecKBK/eVjiOEEEIPSNHXYX7u/7v7nszH/0o9e/Zk/PjxSscQQgidZ6R0AJG9RhVtqVvOht/O3uJmTAIVipsrHUknRUZGkpws9ysQQoicSE9fh6lUKgY3cSRdrWbJUentCyGEeDtS9HVcT5eKlChqyo9/XeZ5SqrScYQQQhRgUvR1nJmxEf0aVuXRsyTWnLyudBwhhBAFmBT9AmBgY0cMVHL5nhBCiLcjRb8AqFDcnI61ynPyzmNCr0crHUfntGrVCjc3N6VjCCGEzpOiX0DI5XvZCwgIYNiwYUrHEEIInSdFv4BoVqUUtUpbs+H0De4+faZ0HCGEEAWQFP0CQqVSMcTdkdR0NctCLykdR6fMmzePtWvXKh1DCCF0nhT9AuTDupWwNjNh2V8XSU5NUzqOzlixYgVbt25VOoYQQug8KfoFiLmpMZ/Wr8L9uER+jbihdBwhhBAFjBT9AmZwE0dUKlgoJ/QJIYR4TVL0C5jKJSx5r7odYTcfcuzmQ6XjCCGEKEC0esOdlJQURo8ezZ07dzAwMGDKlCkYGRkxevRoVCoV1apVY9KkSRgYGLBu3TrWrFmDkZERgwYNokWLFiQmJjJixAgePXqEubk5M2bMwMbGRptN0Al+7k5sO3+HhUcu8HOFd5SOI4QQooDQak//wIEDpKamsmbNGoYMGcKcOXOYPn06w4YNIzg4GLVazd69e4mOjiYwMJA1a9awYsUKAgICSE5OJiQkBAcHB4KDg/H29mbRokXajK8zWlcrg6OtFWtPXudB3HOl4yiuaNGiFClSROkYQgih87Ra9CtVqkRaWhrp6enEx8djZGTEuXPnqF+/PgBNmzbl6NGjnD59GhcXF0xMTLC0tKRChQpERUURHh6Oh4eHZt3Q0FBtxtcZBgYZl+8lp6XzY9hlpeMoLjQ0lB9//FHpGEIIofO0OrxftGhR7ty5Q/v27YmJiWHJkiUcO3YMlUoFgLm5OXFxccTHx2Npaal5nbm5OfHx8VmWZ66bG2fPns3ztoSHh+f5Nl/Hu0ZpmBsZMH//WVoVS8LIQPVG21G6HXlJ2qKb9KUt+tIOkLboIm21Q6tF/+eff8bd3Z2vvvqKe/fu0bt3b1JSUjTPJyQkYGVlhYWFBQkJCVmWW1paZlmeuW5u1KpVC1NT0zxrR3h4OK6urnm2vTf16b2MaXlvmtjSzdn+tV+vK+14W8eOHSMqKgpfX1+lo+QJfflcQH/aoi/tAGmLLsrrdiQlJWXb2dXq8L6VlZWmp16sWDFSU1OpUaMGYWFhABw8eBA3Nzdq165NeHg4SUlJxMXFceXKFRwcHKhbty4HDhzQrKsPH/bbGNwkYz7+hYejFE6irH79+vHtt98qHUMIIXSeVnv6n3zyCWPHjsXHx4eUlBSGDx9OrVq1mDBhAgEBAVSuXBlPT08MDQ3x9fXFx8cHtVrN8OHDMTU1pVevXowaNYpevXphbGzMrFmztBlf5ziWLEYbhzLsvniPiLuPcS5b+K5kEEIIkXtaLfrm5ubMnTv3heVBQUEvLOvevTvdu3fPsszMzIx58+blW76CyM/Did0X77Hw8AWWdW+kdBwhhBA6TCbnKeDaO5WlcgkLgk9c4/GzJKXjCCGE0GFS9As4QwMDBjdx5HlKGivl8j0hhBCvIEVfD3xavypFTQxZ
fPQCaenpSscRQgiho6To6wFrMxM+cq3M9ccJ/H7+jtJxtG7VqlVMnDhR6RhCCKHzpOjriSGF+PK9OnXq4ODgoHQMIYTQeVL09UStMsVpUbUUey/9w/l/nigdRwghhA6Soq9HBjdxAmDhkQsKJ9EuNzc3evfurXQMIYTQeVL09UiHmuUob12UwONXefo8Wek4WpOSkkJaWprSMYQQQudJ0dcjRoYGDGrsSEJyKquOXVE6jhBCCB0jRV/P9G1QFVMjAxYeuUB6ulrpOEIIIXSIFH09845FEXq5VOLywzh2XrirdBwhhBA6RIq+HvJzzzihb0EhvHxPCCFE9nJV9J89e0ZUVBRqtZpnz57ldybxllzK2dCkoi1/RN3lUnSs0nHy3cCBA+ncubPSMYQQQuflWPRDQ0Pp2LEjgwcP5uHDh7Ro0YLDhw9rI5t4C0P+19tfVAgu3xs0aJAUfSGEyIUci35AQADBwcFYWVlha2vL6tWr+f7777WRTbyFzrUrUMbKjJ+PXSE+KUXpOEIIIXRAjkU/PT0dW1tbzeOqVavmayCRN4wNDRjQyIHYxBQCj19VOk6+Gjp0KLNmzVI6hhBC6Lwci37p0qXZt28fKpWK2NhYFi9eTNmyZbWRTbyl/g2rYWyYcfmeWq2/l+8dPHiQkydPKh1DCCF0Xo5F39/fn61bt3Lv3j3atGlDZGQk/v7+2sgm3lJpKzO6OdsTef8pf176R+k4QgghFGaU0wq//PILAQEB2sgi8oGfuyPBJ66x4HAUrRzKKB1HCCGEgnLs6e/bt0+vh4b1XQN7W+qVL8Hv5+9w/XG80nGEEEIoKMeevrW1Ne3ataNmzZqYmppqlk+fPj1fg4m8M8TdiU9CjrD4yAVmeLkqHUcIIYRCciz6nTp10kYOkY+617Fn5NZwVoRdZpKnM0VNcvzYCxRnZ2diYmKUjiGEEDovx+H9Tp06UbNmTRISEnj69ClOTk7yRaCAMTUypH/DasQ8Tyb4xDWl4+S5X375hW+++UbpGEIIofNyLPqbN29m8ODB3L59m7t37+Ln58f69eu1kU3koc8aVcPQQMXCw/p9+Z4QQojs5TjO+9NPP/Hrr79SvHhxIGOe848//piuXbvmeziRd8pZm9Pp3Qqsj7jB4WsP8KhcSulIeSY4OJjr16/j6irnKwghxKvkaka+zIIPYGNjg0qlytdQIn/4uTsCsOCwfs3HP2PGDAIDA5WOIYQQOi/Hnr6joyPTpk3T9Ox//fVXnJyc8j2YyHvulUriXLY4m87c5PaTBKXjCCGE0LIce/pTp07FxMSEsWPHMmbMGExMTJg0aZI2sok8plKpGOLuSFq6mg+DDrHs9AOlIwkhhNCiHIu+sbExdevWZcOGDfz4449UrlwZc3NzbWQT+cCnbiWKGBlw+Fo0P559yOSdEUpHEkIIoSU5Fv3x48eza9cuzeOwsDDp6Rdg3/95jsTUdM1j/12npfALIUQhkeMx/bNnz7J161Yg4yS+H374AS8vr3wPJvLe5J0R+O86/cLyzGWTPJ21HUkIIYQW5Vj009PTefDgASVLlgTg0aNHGBjkOEAgdEx2BT9TQS78R44c4dSpU0rHEEIInZdj0R84cCCdOnXSXAMdERHBuHHj8j2YELllYWGBmZmZ0jGEEELn5Vj0vby8qF+/PqdOncLIyIgJEyZga2urjWwiD2X24LPr7Y9v826B7OUDXL9+nXv37ikdQwghdF6O4/Q3b94kLCyMNm3asH//fgYOHMjZs2e1kU3ksUmezkxsW/ulz5kZG2o5Td7p2LEjI0aMUDqGEELovByL/pgxY0hPT+fPP//k+vXrjBkzhqlTp2ojm8gH/y38XzevgV2xokz8I4K/bkQrmEwIIUR+y7HoJyUl4e3tzb59+/Dy8sLNzY3k5GRtZBP5JLPw96v1DjO8XAn80J10dcaEPU+fy2crhBD6Kseib2hoyM6dO9m/fz/Nmzdnz549cva+Hpjk6cxntTOu
yGhWpRTjWr/L9ccJDFz/l9yFTwgh9FSO1dvf35/9+/czceJESpYsybZt22R4Xw9NaFObJhVtWXfqBj/9fUXpOEIIIfJBrm64M336dM3j2bNn52sgoQwjQwMCP3SnbsA2vtj8N40r2uJUqpjSsYQQQuQhGacXGvY2Fizt1pBnyWn4BB0iMSVN6Ui5MnPmTD7//HOlYwghhM6Toi+y6OpsT/+G1Yi4G8OYbSeUjpMrbdq0oX79+krHEEIInZfj8D5AfHw8cXFxWU7wKlu2bL6FEsoK6OjG4WsPmHcoilYOZfigRjmlIwkhhMgDORb9JUuWsGzZMqytrTXLVCoVe/fuzddgQjlFTYwI/siDhnO303fNUU5+9QFlixVVOla22rdvT3x8PIcOHVI6ihBC6LQci/769evZs2cPNjY22sgjdETtssWZ6eXG0E1/0zv4CH8MaIWhjl6qeffuXZk7QgghciHH/8XLlClDsWJyFndhNKiJAx1qluPPy//ww75zSscRQgjxlnLs6VesWBEfHx8aNGiAiYmJZrmfn1++BhPKU6lU/NijMS6zfmfiHxE0r1qahvZysyUhhCiocuzplypVCg8PjywFXxQeJcxNZZpeIYTQEzn29P38/Hj8+DERERGkpaVRp04d3nnnHW1kEzoic5reqbvPMHD9XwR/5IFKpVI6lhBCiNeUY0//0KFDdOzYkY0bN7Jp0yY6dOjAvn37tJFN6JAJbWrT+H/T9P58TLem6e3SpQstWrRQOoYQQui8HHv6s2fPJjg4mPLlywNw69Yt/Pz85D/ZQsbI0ICgD91xmfU7n2/KmKbXsaRunOA5ceJEwsPDlY4hhBA6L8eefmpqqqbgA5QvX5709PR8DSV0k72NBUu7N8qYpjfwEEmpBWOaXiGEEBlyLPply5bl559/Jj4+nvj4eH7++Wfs7Oy0kU3ooG7O9vRrWJVTd2MY/btuTNPr7+/PihUrlI4hhBA6L8eiP23aNE6dOkXr1q1p1aoVJ0+exN/fXxvZhI6a3bEe1UsVY96hKH4/f1vpOGzYsEHOMxFCiFzI8Zh+iRIlmDNnjjayiAKioE3TK4QQIkO2RX/AgAEsXbqUli1bvvTyrDede3/p0qX8+eefpKSk0KtXL+rXr8/o0aNRqVRUq1aNSZMmYWBgwLp161izZg1GRkYMGjSIFi1akJiYyIgRI3j06BHm5ubMmDFDpgdWSEGaplcIIUSGbIv+lClTAAgMDMyznYWFhXHy5ElCQkJ4/vw5K1euZPr06QwbNowGDRowceJE9u7dS506dQgMDGTDhg0kJSXh4+NDkyZNCAkJwcHBgaFDh7Jt2zYWLVrE+PHj8yyfeD2Dmjiw6+Jdtp67zcx95xnVqpbSkYQQQrxCtl2zkiVLAvDdd99hZ2eX5d/YsWPfaGeHDx/GwcGBIUOGMHDgQJo3b865c+c090Jv2rQpR48e5fTp07i4uGBiYoKlpSUVKlQgKiqK8PBwPDw8NOuGhoa+UQ6RN1QqFSt6NMauWFEm/HGKv25EKx1JCCHEK2Tb0/fz8yMyMpL79+/TqlUrzfK0tDRKly79RjuLiYnh7t27LFmyhNu3bzNo0CDUarXm8IG5uTlxcXHEx8djaWmpeZ25ubnm6oHM5Znr5sbZs2ffKO+r6Mt14XnRjvFutgzee4NuK/YS1L4yFiaGeZAs96ysrAD9+UxA2qKL9KUdIG3RRdpqR7ZF/7vvvuPJkydMnjyZb7755v9fYGREiRIl3mhn1tbWVK5cGRMTEypXroypqSn//POP5vmEhASsrKywsLAgISEhy3JLS8ssyzPXzY1atWphamr6RplfJjw8HFdX1zzbnlLyqh2uwG3VKabtOcPSy0ms/shdq9P0Hjp0SG8+E9Cf3y/Qn7boSztA2qKL8rodSUlJ2XZ2sx3et7CwoFy5cjx8+DDL0H6pUqUwMsrxpP+XcnV15dChQ6jVau7fv8/z589p1KgRYWFhABw8eBA3Nzdq
165NeHg4SUlJxMXFceXKFRwcHKhbty4HDhzQrKsPH7a+mNi2No3sbVl76rrOTdMrhBAiQ47V+5133uH48ePUrl37re+016JFC44dO0bXrl1Rq9VMnDiRcuXKMWHCBAICAqhcuTKenp4YGhri6+uLj48ParWa4cOHY2pqSq9evRg1ahS9evXC2NiYWbNmvVUekXeMDA0I+sidugpM07t7924uX74sXwKFECIHORb9M2fO8NFHH2VZplKpiIyMfKMdjhw58oVlQUFBLyzr3r073bt3z7LMzMyMefPmvdF+Rf6r+L9penv+chCfwEMc/aI9pkb5f3z/66+/Jjk5mUGDBuX7voQQoiDLsej/9ddf2sgh9EQ3Z3t2N6jKirDLjNl2goCO9ZSOJIQQ4n9yLPrPnz9nwYIFhIaGkpaWRsOGDfniiy8oWlRmYBMvN8e7HkevRzP3YBStqpXh/RrllI4khBCCXMy97+/vz/Pnz/n222+ZMWMGKSkpTJo0SRvZRAFV1MSI1R+5Y2pkQJ81R7kX+0zpSEIIIchF0T937hwTJ07EyckJJycnJk6cyLlz57SRTRRgzmVt+MHLlYcJSfQOPkJ6ulrpSEIIUejlWPTVajWxsbGax7GxsRgaanfyFVEwDW7iyAc1yrH30j/M3C9fFIUQQmk5HtP/5JNP6NatGy1atADgzz//pH///vkeTBR8GdP0NsJl1u9M2HGKZlVK0cDeNs/389tvv+XLrItCCKFvcuzpd+nShXnz5lG+fHns7OyYP38+3bp100Y2oQfesSjCLx+6k6ZW82HQYZ4+T87zfVSsWJEyZcrk+XaFEELf5Fj0hw4diqOjIx9++CG+vr44OjrSu3dvbWQTeqJF1dKMaVWLa4/jGbQ+DLU6b4/vx8fH8/z58zzdphBC6KPXvuFOamqq9KrEa5vY1pl9l+6z9tR12jqW5ZP6VfJs202aNCE5OfmNJ4wSQojCIscb7kybNi3LPevf5oY7ovAy/s80vY0qvqO1aXqFEEJkyPGGO3PnziUuLg47OztOnDjBzz//nOVsfiFyK3Oa3oTkVD4MOkxSaprSkYQQolDJ8Zj+iBEj2Lp1KxEREcyfPx8LCwvGjBmjjWxCD3Vztqdvg6qcvPOYsdtOKh1HCCEKlRyL/u3btxkxYgS7du2ia9euDBkyhIcPH2ojm9BTszu64VTSijkHI9keeUfpOEIIUWjkWPTT0tJ4/Pgxe/bsoXnz5kRHR5OUlKSNbEJPmZsaE+zrgYmhAX3WHJFpeoUQQktyLPp9+/ale/fuNGvWDAcHBz766CMGDx6sjWxCj2VO0xsd//bT9I4aNQpfX988TCeEEPopxxn5vLy88PLy0jzevn27TMMr8sQQd0d2XbzLtvN3mLn/HCNb1nqj7fj4+BAeHp7H6YQQQv9kW/QHDBjA0qVLadmyJSqV6oXn9+7dm6/BhP5TqVSs7NGYOvk8Ta8QQogM2Rb9KVOmABAYGKi1MKLweceiCIEfutNmyW4+DDpM+JfvU8zM5LW28fHHHxMTE8PWrVvzKaUQQuiHbIv+0aNHX/lCOzu7PA8jCqfMaXq/3XOWwRvCCPrQ/aWjS9mJiIggOTnv5/QXQgh9k23RDwsLA+DmzZvcuHGDZs2aYWhoyOHDh6latSre3t5aCyn0X+Y0vWtOZkzT27te3k3TK4QQIkO2RX/69OkA+Pr6smXLFmxsbAB4+vQpQ4YM0U46UWhkTtPrMut3hm78m0YVbXGwtVI6lhBC6JUcL9l78OAB1tbWmsdmZmZER0fnayhROFW0sWBJ14YkJKfiE3hIpukVQog8luMle82bN+fTTz+lbdu2qNVqduzYQfv27bWRTRRCPVwqsufiPVb+fZmx204yq6Ob0pGEEEJv5Fj0x4wZw86dO/n7779RqVT06dMny612hchrc7zdOHLtAXMORtLKoQzvVX/1SaNNmzbl0aNHWkonhBAFV45FH8DT0xNPT8/8ziIE8P/T9Daa
u4M+a45w8qsPKGNVNNv158+fL5PzCCFELuR4TF8IJdSxs+F7r7p5Mk2vEEKIDFL0hc7yc3fi/Rp27L30D7P2n892vcWLF7Nx40YtJhNCiIJJir7QWZnT9JaxMmP8jpP8ffPlt3ResmSJFH0hhMgFKfpCp71jUYRffJqQplbzYdAhYhNl5j0hhHhTUvSFzmtZrQyjW9bi6qN4Bq0PQ62W4/tCCPEmpOiLAmGSpzMN7d9hzcnr/HL8qtJxhBCiQJKiLwoEY0MDgj50x6qIMUM3/s3F6FilIwkhRIEjRV8UGJVKWL50ml5jY2MMDQ0VTieEELpPir4oUHq4VOTT+lU4eecx47afBMBr2gqafPWDwsmEEEL35WpGPiF0yVzvehy9Fs3sA5H8E/uckJPXASi7M4JJns7KhhNCCB0mPX1R4GRO02uggpCT1zF4eAuDh7fw33WayTsjlI4nhBA6S4q+KJB+O3uLzJl5zfetxHzfSgAp/EII8QpS9EWBM3lnBP67Tmf7vBR+IYR4OSn6QgghRCEhRV8UOJM8nZnYtna2z1cuYUGHmuW1mEgIIQoGKfqiQMqu8FeyMefqo3jcZm/DJ/AQlx/KJD5CCJFJir4osP5b+Ce2rc3lcZ3ZOaA1ruVsWHvqOjVnbGHw+jDuxT5TMKkQQugGuU5fFGiTPJ25N3IKDx9Ga67Rb+1QhlbV3mPD6ZtM2HGKpaEX+eX4Fb5oWp0RLWpibWaicGohhFCG9PRFgbfErxdjvJpkWaZSqejqbM+ZEV4s6daQ4mYmfLf3LFWnbeKHP8/xPCVVobRCCKEcKfpCrxkZGtC/YTUujvVmxgd1ARi97QQO325m+V+XSE1LVzihEEJojxR9UeA1atSIfv36vXIdM2Mjvm5Rk8vjOjG6VS1inicz8Ne/ePeHrfwacQO1Wq2ltEIIoRwp+qLAe/bsGYmJibla19rMhGnvuXBprDcDGztw9VEcPX85SIM529lz8V4+JxVCCGVJ0ReFUhmroizs0oBzozrQo05Fwm8/xnPpHtou2c2xmw+VjieEEPlCir4o1Kq+Y0WwrwfHh7+Pp1NZ9l76h4Zzd9Bt1QGi7j9VOp4QQuQpKfpCAC7lbNjevxV7B7Whof07bDx9k3d/2Er/taHcfpKgdDwhhMgTUvSF+JfmVUtzeGg7Nn7aHKeSVqz8+zIO0zczcms4jxKSlI4nhBBvRYq+KPD69u2Ll5dXnm1PpVLRsVZ5Tn39ASt6NKakRRFm7T9P1W838e2eMyQkpeTZvoQQQpuk6IsC7/PPP6dHjx55vl1DAwM+qV+FqNHeBHR0w9jAgAk7TlFt+mYWH7lAcmpanu9TCCHykxR9IXJQxNiQL5pW5/I4bya0qU18Uip+G/+m5vdbCD5xjfR0ucZfCFEwSNEXBd6XX37JnDlz8n0/VkVM+KadM5fHejPUw4lbT57hu/owbrO3sSPyjkzwI4TQeYoU/UePHtGsWTOuXLnCjRs36NWrFz4+PkyaNIn09IxpUdetW0fnzp3p3r07+/btAyAxMZGhQ4fi4+ND//79efz4sRLxhY7Zu3cvx48f19r+SlqaMce7HpGjOvCRa2VO34vhgx//pOWiXYRej9ZaDiGEeF1aL/opKSlMnDiRIkWKADB9+nSGDRtGcHAwarWavXv3Eh0dTWBgIGvWrGHFihUEBASQnJxMSEgIDg4OBAcH4+3tzaJFi7QdXwiNSiUsWeXThJNffcAHNcpx8OoD3Of/QaeV+zj3zxOl4wkhxAu0XvRnzJhBz549KVmyJADnzp2jfv36ADRt2pSjR49y+vRpXFxcMDExwdLSkgoVKhAVFUV4eDgeHh6adUNDQ7UdX4gXvFumOL/1bcGBIZ40qWjLlnO3cZ65lU9DjnDjcbzS8YQQQsNImzvbuHEjNjY2eHh4sGzZMgDUajUqlQoAc3Nz4uLiiI+Px9LSUvM6c3Nz4uPjsyzPXDc3zp49m8ctgfDw8DzfphL0oR3JycmA
8m0xAwIavcMR+yIsinjAL8evEnLiGl2qFefTmu9QvEju/9yUbkte0pe26Es7QNqii7TVDq0W/Q0bNqBSqQgNDSUyMpJRo0ZlOS6fkJCAlZUVFhYWJCQkZFluaWmZZXnmurlRq1YtTE1N86wd4eHhuLq65tn2lKIv7TAxMSE5OVln2uIG+H2QzpqT15n0RwRrLjzm9+uxfNWsBsOb1cCyiPErX68vnwvoT1v0pR0gbdFFed2OpKSkbDu7Wh3eX716NUFBQQQGBlK9enVmzJhB06ZNCQsLA+DgwYO4ublRu3ZtwsPDSUpKIi4ujitXruDg4EDdunU5cOCAZl19+LDF26tevToVK1ZUOkYWhgYGunrIYAAAGJdJREFUfOhamfOjOjCvUz2KGhsxeddpqn67iXkHI0nK5hr/yTsjWHb6gZbTCiEKC8Uv2Rs1ahTz58+nR48epKSk4Onpia2tLb6+vvj4+NC7d2+GDx+OqakpvXr14tKlS/Tq1Yu1a9fi5+endHyhA9asWcPUqVOVjvFSJkaGDHF34tJYb/zbOZOUms7w345T/bvf+OX4FdL+d7UKZBR8/12n+fHsQybvjFAwtRBCX2l1eP/fAgMDNT8HBQW98Hz37t3p3r17lmVmZmbMmzcv37MJkdcsTI0Z16Y2Axo58N2fZ1l05AKfhhxl5r5zTG3vwonbj5iy+4xmff9dpwGY5OmsVGQhhB5SrOgLkVfWr1/PtWvXCsThnncsijCzgxufe1THf1cEq45dpdNP+1+6rhR+IUReU3x4X4i3NWXKFFauXKl0jNdSobg5P/ZozIBG1V65nv+u0zLUL4TIM1L0hVCQrUWRHNd58jxZC0mEEIWBDO8LoaDMofvMofyXmXcoit0X79HOqSztnOzwqFwSUyNDbUUUQugRKfpCKCy7wj/U3RHHksXYEXWHfZf/YfaBSGYfiMTcxIiW1UrTzsmO9k5lsbexUCK2EKIAkqIvhA74b+Gf2La2ZtmgJo4kpqRx8Op9/oi6wx+Rd9l67jZbz90GoEapYrRzsqOdU1ncZRRACPEKUvSF0BGZRf7u3bsvnLFfxNiQto5laetYloCOcPVRHH9E3tWMAgQcOE/AgfOaUYD21e1o72RHheLmSjRFCKGjpOiLAu/AgQOcOnVK6Rh5YpKnM+HhqTmuV7mEJYPdHRnsnjEKcODK/0YBol4cBWhf/X+jAJVKYiKjAEIUalL0RYFnbW2d5QZNhU0RY0M8ncri6VSW2cCVh3H8EXWHHVF32X/5H2btP8+s/eexMDWiZdX/HwUoL6MAQhQ6UvRFgXfnzh2io6OVjqEzqrxjyRB3J4a4O/E8JZWDVx6wI+oOf0TeYcu52//X3r0HR13eexx/7+Z+21w3AcIlCUkkQAENggVEqLRQe6SKqIUWbLHOlKFV7BnKpYBj0aaIdRTOULAt0x50ZFBR8NgCggQktKnNKIQYJDduScgFQnMhZpOw549N1kRAcv9ldz+vGSZm89vd7zMYPs8+v+fCnpZRgFEDHHMBvpsSy+Q4q0YBRDyAQl9c3n333YfNZmPWrFlGl9LvBPh4O0cBeOBO5yjA33KLSc8vazcKcG/SQGaNGKRRABE3ptAX8SBfHQVwzAUo4e+5xew+eZ7dJ88DMHpAmGNfAI0CiLgVhb6Ihwrw8W5Z6hfLyw/cSX5lNXtzS/jbqWIO55fxYvpnvJj+GSF+Ptyb/OW+AIPDOjYK8Oy+45SUlLO1/x+JIOIxFPoiAkBilIWf323h53c7RgHS8x0rAv6eW8K72ed5N9sxCvCNgWHOfQEmx0fj43X9bt6txwQDDNp3XIcGifQTCn0RuU6Aj7djln9KLK88CHkV1e1WBGSXXmHDoRxC/HyYkdwyFyAlltjQwHaBDzotUKQ/UeiLyC0lWS0kWS384u4UrtqaSC8oY29uMX8/Vcw72ed4J/scANHBfpTXNlz3fAW/SP+g0BeXl5aWRkFBgdFleIxAX2/uS4nlvpRY
7HY7eZU17M0tZtPRUxReqr3p8xT8IsZT6IvLu++++8jKyjK6DI9kMplItlpItlqoqrd97WmBAH/OzKPO1sTk+GgmxVk7dLSwiPQchb6I9IhbHRM8yBJAWc0Xzr0BAG6zWpgcH83k+GimJFgZHhmCyWTqs5pFPI1CX1ze7Nmzqamp4dChQ0aX4vFuFvytpwbWNTTyr/OXyCgq52hhOf88W8m2f+Wz7V/5AMSE+DMpLpop8VYmx0czLjbihqsDRKRrFPri8s6ePYvNZjO6DGnxdccEB/n5MD1xANMTBwDQfO0a2aVXHJ2Alo5A24mBgb5e3DXU0QGYFG/lrmFRWPx9DWiViHtQ6ItIj/u6Y4Lb8jKbGRcbwbjYCJZMGYHdbudsVR1Hi8o5VlRBRlE5H+Zf5MP8iwCYTSbGDgpncstIwOT4aGJDA/ukTSLuQKEvIr2io8cEt2UymYiLCCYuIpgfpSYAcPlqA/844+gAHDtTwb/OVfJJ8WX+5+jnAMRFBH05LyA+mpToUMxmzQsQuRGFvoj0axGBfnxv5GC+N3IwAA1NzWSdv0RGUYVjROBMOa9nFfF6VhEA4QG+TIq3MjnO0REYPyQSfx+dHSACCn0RcTF+3l5Mio9mUnw0yxjFtWt2Pq+o5mhRORktf97/rJj3PysGwNfLzJ1DIp3zAibFRRMZ5Nfh99MZAuJOFPri8mbPnk1ZWZnRZYhBzGYTKTGhpMSE8sRdSQCUVl8lo2VOQEZROf84W0nGmQpoWeAxMia0zS0BK3ERwTdcKqgzBMTdKPTF5a1bt06b80g7Ay2BzB07jLljhwFQ80UjmecqOdaySuCfZyv5rCyPP/4zr+X6AGcHYHJ8NGMGhvP8gWydISBuR6EvIm4vxN9xMNCM5IEANDVf43hJlXOpYEZRBW8dP8tbx88C4ONlorHZft3rKPjF1Sn0xeWlpaVRWlpKaqpuukrHeHuZSR0SSeqQSJ6cmoLdbqfoci1Hi8rZeCSXT4qrbvrc3+w/ga2pmee/d0cfVizSMxT64vJ27NihzXmkW0wmEwmRISREhlB0qfZrQx/ghUM5fFRYzrTEAdwzPIZJ8VYCfPTPqfR/+r9URKSNW50hMCnOSmPzNefkwOcPZOPrZWbisCimDR/AtMQY7hpm1TJB6ZcU+iIiX3GrMwQAqr+w8VFhOen5ZRwuuEhGUQUfFZaz7gPw8zbzzWFW7hkew7TEAUwcFoWftzoBYjyFvojIDXzdGQIAFn/fdpsGXam38VFhGen5ZaTnX+RwYRnpBWU8u/8E/t5eTIqzMi0xhnuGD2DC0Eh81QkQAyj0RURuoqNnCACEBfhy/6gh3D9qCODYPvhIQRmHCxwdgS/PEDhOgI+jEzA9cQDTEgcwfkikThOUPqHQF5dntVqpq6szugxxU105QwAc2wc/8I2hPPCNoQBU1n7BkcJy0vMvkl5wkYN5jj8AQb7eTI6PZtrwGKYlxpA6OBJvdQKkFyj0xeUdOHBAm/NIvxcV7M+cMUOZM8bRCSivqedwYTmH8y+SXlDG/s9L2P95CQDBft5MiY9mesvqgNtjI9QJkB6h0BcRMUB0SAAPjx3Gwy27Bl6srnfcCii4yOH8MvaeKmHvKUcnwOLv4+wETEuMYeygcLzM6gRI5yn0xeWlp6eTl5enzXnEpQ2wBPDo7XE8enscACX/uUp6gWNlQHp+GX/LLeZvuY5DhMICfLk7ofV2wADGDAzv0HHCOjxIFPri8p566ilsNhtPPPGE0aWI9JhBoYHMvyOe+XfEA3DhSh3pBS0rAwrKeC/nAu/lXAAcxwlPHR7D9JbVAaMHhF3XCdDhQQIKfRERlzA4LIgfpSbwo9QEAM5erm0ZCXB0BHafPM/uk+cBiAz0c3YCpiUO4M1Pz7Dug2zna+kMAc+l0BcRcUHDIoJ5LCKYx+4cDsCZy7Ucyr/o3CfgnexzvJN97qbPV/B7JoW+iIgbiIsI5icTEvnJhETsdjuFl2r55e6P
+b/Pim/6nN/sP8GxonL+e/ooxg4KJyYkoA8rFiMo9EVE3IzJZGJ4VAh3DI782tAHOJB3kQMt+wVEB/szZlA4YweF842Bjq8joi3aPdCNKPRFRNzUrQ4PWjL5NqYOj+FESRUnSqs4UVLFgdOlHDhd6rzGx8tMSnQoYwaFM2ZgmLNTEK1RAZek0BeX9+abb5KTk2N0GSL9UkcOD5rbslcAOM4QyG7pALR2BLJLr3CitP1xwzEh/owZGO7oDLR0BG6zalSgv1Poi8tLTk6mpqbG6DJE+q1bHR7UlmMPgBjuTohxPtZ87RoFl2o5XlJFdkkVx1s6BB+cLuWDr4wKjIwJdd4aaB0d0KhA/6HQF5dns9lobGw0ugyRfq0zhwd9lZfZTLLVQrLV4txBEByjAo6RgJaOQEkVJy9e4XhJFa+12Rl7QEhAu9sDYwaFMyI6tFuHDGmjoa5R6IvLu/POO7HZbOTm5hpdiki/1tXDg24mrGVToKnD248K5FfWcKL0CidKLjtGB0qvtDtbAMC3dVSg5dZA660Ca7D/Ld9XGw11nUJfRER6jJfZzG3RodwWHdpuVKDqaoNjbkDL7YHsUseowKclVWxv8/yBloDrbg/c1mZUoG3gg/Yb6CyFvoiI9Lrwll0CbzQq0HproHXi4I1GBUYNCKP52jVOlF657rUV/B2n0BcREUO0HRV4ZFyc8/Gqqw3O2wMnShwrBz65cJlmu/2mr/Wb/Sc4WXqFlTNGkxRlIcTfpw9a4HoU+iIi0q+EB/pxz/AY7mkzKvDM3k95rs35ATeyK/scu1q2Ho4J8ScpykKSNYSkKAuJrV+jQgj09dzo89yWi4iIy3h21jjMJtNNNxqad3scE4dFkVdRQ15lDXkV1Rw7U8HRovLrro0NDSQpKoREawjJURYSrRaSokJIiAzB38e99xlQ6IvL++Uvf8m5czc/WERE3ENHNhpqq6GpmaJLteRVVpNfWUNeRQ35ldXkVdY4jikuKGt3vckEQ8OCSIwKIalliWLrf8dHBHdrieHN9PXSQ4W+uLzHHnuMrKysW18oIi6vMxsN+Xl7MSImlBExodf9rL6xiYJKx6hAfkVNm45BNQfzLnKw5TyCVl5mE3HhwS23CUJabh04bh8MCw/Cy9z5DoERSw8V+iIi4lK6s9FQqwAfb0YPDGf0wPDrflbb0OjoAFTWkF9R3e7rvlMl7PvK9T5eZhIigr+cN9DyNdlqYXBoIGaz6br3MGrpYZ+GfmNjI6tWraK4uBibzcbixYtJTExkxYoVmEwmkpKSeOaZZzCbzezcuZMdO3bg7e3N4sWLmT59Ol988QXLli3j0qVLBAUFsX79eiIiIvqyCdIPPf7441RVVbFr1y6jSxGRPtLTGw21Feznw7jYCMbFXp8v/6m3OecMODoG1c6Rgs8rqoH2pxr6e3sxPCqYxChLyzwCC8eKyvnffxde99p9Efx9Gvp79uwhLCyMDRs2UFVVxYMPPsiIESNYunQpEydOZO3atRw8eJBx48axfft23n77bRoaGpg/fz6TJ0/mjTfeIDk5mV/84he8//77bN68mdWrV/dlE6Qf+ve//43NZjO6DBHxAKEBvowfEsn4IZHX/ezy1QbyKqo53Tp3oM0cgpyL/+nQ6/d28Pdp6M+aNYuZM2c6v/fy8iInJ4cJEyYAMHXqVDIyMjCbzdx+++34+vri6+vL0KFDOXXqFFlZWfz0pz91Xrt58+a+LF9EROSmIgL9mDjMysRh1naP2+12Kmq/IK+yhg2Hcngv54JBFfZx6AcFBQFQW1vLk08+ydKlS1m/fj0mk8n585qaGmprawkJCWn3vNra2naPt17bESdPnuzhluA2E8fcoR2tn/LdoS2t1Jb+x13aAWqLUfyBNWMtxJii+NPJyhte89PRUfxXVFOvtavPJ/KVlpayZMkS5s+fz/3338+GDRucP6urq8NisRAcHExdXV27x0NCQto93nptR4wePRo/P78ea0NWVhap
qa5/tJO7tMPX1xebzeYWbQH3+XsB92mLu7QD1Jb+YGuqY7Z+R5cedlZDQ8NNP+z2/KLDr1FZWcmiRYtYtmwZc+fOBWDkyJFkZmYCcOTIEcaPH8+YMWPIysqioaGBmpoaCgoKSE5O5o477uDw4cPOa13xL1tEROSZmWNZ+50xzu97KvBvpU8/6W/ZsoXq6mo2b97svB//61//mueee46XXnqJhIQEZs6ciZeXFwsWLGD+/PnY7Xaefvpp/Pz8mDdvHsuXL2fevHn4+Pjw+9//vi/Ll37qm9/8JpcuXTK6DBGRTumJpYed1aehv3r16hvOtn/ttdeue+yRRx7hkUceafdYQEAAGzdu7LX6xDVt2bLFpe7riYi06s2lhzfSp8P7IiIiYhyFvri8P/3pT+zevdvoMkRE+j2Fvri8TZs28eabbxpdhohIv6fQFxER8RAKfREREQ+h0BcREfEQCn0REREP0efb8PYlu90O0CsnsDU0NPT4axrBHdoRGRlJY2OjW7SlldrS/7hLO0Bt6Y96sh2tmdeagW2Z7Dd61E3U1NRw+vRpo8sQERHpc8nJye0OrwM3D/1r165RV1eHj4+P8yQ/ERERd2a322lsbCQoKAizuf1dfLcOfREREfmSJvKJiIh4CIW+iIiIh1Doi4iIeAiFvoiIiIdw63X6PamxsZFVq1ZRXFyMzWZj8eLF3HvvvUaX1SXNzc2sXr2aoqIivLy8SEtLY+jQoUaX1WWXLl1izpw5bNu2jeHDhxtdTpc98MADzuU1gwcPJi0tzeCKum7r1q18+OGHNDY2Mm/ePB5++GGjS+qSXbt28c477wCOddS5ublkZGRgsVgMrqzzGhsbWbFiBcXFxZjNZtatW+eSvy82m42VK1dy/vx5goODWbt2LXFxcUaX1WnHjx/nxRdfZPv27Zw9e5YVK1ZgMplISkrimWeeuW7WfU9R6HfQnj17CAsLY8OGDVRVVfHggw+6bOgfOnQIgB07dpCZmUlaWhp/+MMfDK6qaxobG1m7di3+/v5Gl9ItrRtzbN++3eBKui8zM5NPPvmEN954g/r6erZt22Z0SV02Z84c5syZA8Czzz7LQw895JKBD3D48GGamprYsWMHGRkZvPzyy2zatMnosjpt586dBAYGsnPnTgoLC1m3bh1//vOfjS6rU/74xz+yZ88eAgICAEhLS2Pp0qVMnDiRtWvXcvDgQb797W/3yntreL+DZs2axVNPPeX83svLy8BqumfGjBmsW7cOgJKSEqKiogyuqOvWr1/PD37wA6Kjo40upVtOnTpFfX09ixYtYuHChXz66adGl9RlR48eJTk5mSVLlvCzn/2MadOmGV1St2VnZ5Ofn8+jjz5qdCldFh8fT3NzM9euXaO2thZvb9f8zJefn8/UqVMBSEhIoKCgwOCKOm/o0KHtOlw5OTlMmDABgKlTp3Ls2LFee2/X/Fs3QFBQEAC1tbU8+eSTLF261OCKusfb25vly5fzwQcfsHHjRqPL6ZJdu3YRERHB3Xffzauvvmp0Od3i7+/P448/zsMPP8yZM2d44okn2Lt3r0v+w1xVVUVJSQlbtmzhwoULLF68mL1797r0Bllbt25lyZIlRpfRLYGBgRQXF/Pd736XqqoqtmzZYnRJXZKSksKhQ4eYMWMGx48fp6ysjObmZpf6IDZz5kwuXLjg/N5utzt/P4KCgqipqem199Yn/U4oLS1l4cKFfP/73+f+++83upxuW79+Pfv27WPNmjVcvXrV6HI67e233+bYsWMsWLCA3Nxcli9fTkVFhdFldUl8fDyzZ8/GZDIRHx9PWFiYy7YlLCyMKVOm4OvrS0JCAn5+fly+fNnosrqsurqawsJC7rrrLqNL6Za//OUvTJkyhX379rF7925WrFjhkvvWP/TQQwQHB7Nw4UIOHTrEqFGjXCrwb6Tt/fu6urpevYWk0O+gyspKFi1axLJly5g7d67R5XTLu+++y9atWwEICAjAZDK55C/N
66+/zmuvvcb27dtJSUlh/fr1WK1Wo8vqkrfeeovf/e53AJSVlVFbW+uybUlNTeWjjz7CbrdTVlZGfX09YWFhRpfVZR9//DGTJk0yuoxus1gszomioaGhNDU10dzcbHBVnZednU1qairbt29nxowZDBkyxOiSum3kyJFkZmYCcOTIEcaPH99r7+V6Y4cG2bJlC9XV1WzevJnNmzcDjskYrjiB7Dvf+Q4rV67khz/8IU1NTaxatQo/Pz+jy/Joc+fOZeXKlcybNw+TycRvf/tblxzaB5g+fToff/wxc+fOxW63s3btWpfsVLYqKipi8ODBRpfRbT/+8Y9ZtWoV8+fPp7GxkaeffprAwECjy+q0YcOG8corr7Bt2zZCQkJ4/vnnjS6p25YvX86aNWt46aWXSEhIYObMmb32Xtp7X0RExENoeF9ERMRDKPRFREQ8hEJfRETEQyj0RUREPIRCX0RExEMo9EWkx2VmZrJgwQKjyxCRr1Doi4iIeAiFvoj0qr/+9a8sWLCA+vp6o0sR8XiuueWXiLiEXbt2sX//fl599VXnMaIiYhx90heRXnH69GnWrFnDwoULnadUioixFPoi0iuCgoLYtGkTL7zwgkue4ijijhT6ItIrYmNj+da3vsWECRPYuHGj0eWICAp9Eellv/rVr3jvvffIyckxuhQRj6dT9kRERDyEPumLiIh4CIW+iIiIh1Doi4iIeAiFvoiIiIdQ6IuIiHgIhb6IiIiHUOiLiIh4CIW+iIiIh/h/vCCCwXHM1LYAAAAASUVORK5CYII=\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "plot_model(kmeans, plot = 'elbow')" ] }, { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [ { "data": { "text/html": [ " \n", " " ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "plot_model(kmeans, plot = 'silhouette')" ] }, { "cell_type": "code", "execution_count": 13, "metadata": {}, "outputs": [ { "data": { "text/html": [ " \n", " " ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "plot_model(kmeans, plot = 'distance')" ] }, { "cell_type": "code", "execution_count": 14, "metadata": {}, "outputs": [ { "data": { "text/html": [ " \n", " " ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "application/vnd.plotly.v1+json": { "config": { "plotlyServerURL": "https://plot.ly" }, "data": [ { "alignmentgroup": "True", "bingroup": "x", "hovertemplate": "Cluster=%{x}
count=%{y}", "legendgroup": "Cluster 0", "marker": { "color": "#636efa", "opacity": 0.7 }, "name": "Cluster 0", "offsetgroup": "Cluster 0", "orientation": "v", "showlegend": true, "type": "histogram", "x": [ "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0" ], "xaxis": "x", "yaxis": "y" }, { "alignmentgroup": "True", "customdata": [ [ "Honduras", 2.86657957, 2.460607584, 2.37295217, 2.92390839, 2.902757343, 3.592970163, 3.6164590089999997, 3.906168524, 4.7330869369999995, 4.207177311000001, 3.905898653, 3.48897019, 3.63946928, 3.7255735989999996, 4.554171531000001, 4.215610713999999, 3.916841875, 4.453647583, 4.457074848, 4.41783425, "Cluster 0" ], [ "Dominica", 4.159861137, 4.217261905, 4.370036617, 4.155978162, 4.149951581, 3.308396479, 3.23826402, 3.290272803, 3.173775978, 2.9741580819999998, 3.0197000010000004, 3.094683051, 3.0779197789999997, 2.96951027, 3.6526046819999998, 4.047182568999999, 3.9743900930000002, 3.6693638839999996, 3.812216844, 3.767972854, "Cluster 0" ], [ "Djibouti", 2.384148412, 2.318293685, 2.83292067, 3.6097572010000003, 4.407148156, 3.9005062999999995, 3.4863802660000003, 3.516449396, 4.167696582, 4.600888287, 4.939467764, 
4.702732187, 5.337600592, 5.745632858, 5.957206032, 5.149939099, 5.019683712, 5.25888563, 5.322417486, 6.750847587000001, "Cluster 0" ], [ "Samoa", 3.390716641, 3.010723905, 3.338794876, 3.926948968, 4.269501817, 4.11544971, 3.848022139, 3.940851472, 3.64949145, 3.596860784, 3.5879326000000002, 3.925566538, 4.509782876, 3.8248453000000002, 4.341031427, 4.985224399, 5.101682632, 4.337641237, 6.216667467000001, 6.536868986, "Cluster 0" ], [ "San Marino", 4.5639391830000005, 4.383787117, 4.3124433369999995, 4.248369167, 4.300679912, 4.385399883, 4.296809438, 4.26944922, 3.90726845, 3.832377435, 3.7497484489999997, 3.52237298, 3.54154425, 3.616263881, 4.204062797, 4.647450421, 5.322357589, 5.865948338, 5.656072233, 5.736058813, "Cluster 0" ], [ "Sao Tome and Principe", 2.805079353, 1.966810767, 2.938184371, 2.9092363480000003, 3.8562996519999997, 3.823975859, 3.792038305, 3.8456142939999998, 6.03861594, 5.1383615769999995, 5.29330423, 2.5410377769999997, 2.13790765, 1.592076218, 2.507352864, 2.537331158, 2.6053125880000003, 2.48230437, 3.5868170939999997, 3.612254726, "Cluster 0" ], [ "Colombia", 3.7205698160000003, 5.067606606, 5.593914054, 6.103439101, 6.459251592, 4.683826863999999, 4.690523841, 4.549736058, 4.899277437, 4.082866763999999, 4.316017077, 4.535042305, 4.539526519, 4.698007256, 5.148273784, 4.9756529380000005, 5.016164698, 5.277512194, 5.2189183660000005, 5.409943154, "Cluster 0" ], [ "Chile", 2.483034377, 2.667579501, 2.722896255, 2.999279862, 3.188783313, 3.332061767, 3.484542158, 3.529890881, 2.687549761, 2.63814344, 2.536291524, 2.517617347, 2.655656258, 2.942588718, 3.468102151, 3.294925632, 3.3326392360000003, 3.4761647210000004, 3.632821452, 3.8513094239999996, "Cluster 0" ], [ "Cabo Verde", 4.252399745, 3.9401934880000002, 3.862837242, 3.92627046, 3.424656164, 3.5249331219999998, 3.9135356839999997, 3.893120524, 3.746871642, 3.7893525489999997, 3.649990513, 3.962680293, 3.3863364560000004, 3.03734974, 3.239265323, 3.431766845, 
3.3357602589999997, 3.33864148, 3.120439872, 3.557226753, "Cluster 0" ], [ "Solomon Islands", 3.013517642, 2.7842825980000003, 3.047041542, 3.2772146280000003, 3.544792113, 4.299521273, 6.162337203, 5.8209578, 5.537965968, 5.180937453, 7.370558602000001, 6.205507441, 5.9541656089999995, 5.522732105, 7.453790237000001, 7.022895121, 4.696250372, 5.0946949560000006, 4.99069527, 4.640482319, "Cluster 0" ], [ "Bulgaria", 3.515523463, 3.1825410080000003, 3.397999988, 3.262490099, 3.883886627, 3.6982741960000003, 4.2243892810000006, 4.536791795, 4.617962963, 4.30515357, 4.312971455, 3.800812847, 3.730705859, 3.8703163560000005, 3.75184985, 4.0342301, 3.7596558460000002, 3.9998185019999997, 4.1228617419999996, 4.60763146, "Cluster 0" ], [ "South Africa", 3.4277404380000003, 3.8406204760000002, 3.7549938330000003, 3.584417155, 3.418376453, 3.290839079, 3.330803407, 3.231917455, 3.3379947910000003, 3.218086131, 3.315898573, 3.360932915, 3.3985272369999997, 3.595345502, 3.94739833, 3.990053885, 4.1340834939999995, 4.276293506, 4.204760905, 4.24326873, "Cluster 0" ], [ "Brazil", 2.800558403, 2.700450075, 2.874414942, 2.7969900130000003, 2.9525750339999997, 2.832471845, 3.040958916, 3.1829922930000003, 3.080328175, 3.323675591, 3.43190885, 3.4926520919999997, 3.4551482289999997, 3.61158219, 3.8413556489999996, 3.786139623, 3.6540019860000004, 3.66135204, 3.827307012, 3.831759885, "Cluster 0" ], [ "Botswana", 2.126873521, 2.123124439, 2.429731822, 2.1792576759999998, 2.163569841, 2.8998524210000003, 4.146457238, 4.894689856, 2.969796404, 3.888095917, 4.090479196, 3.479114149, 3.3157118810000004, 3.9283219289999995, 4.494537231, 3.544461785, 3.236016942, 3.9553822110000003, 3.50694528, 3.193884455, "Cluster 0" ], [ "Bolivia", 2.112215194, 2.9782255189999995, 2.66726091, 3.122442061, 3.602860899, 3.245343618, 3.744167609, 4.101807461, 3.4962789219999997, 3.492276415, 3.860740789, 3.521340785, 3.408827783, 3.4068432439999996, 3.9482262710000002, 3.662996725, 3.7521416939999996, 
3.772366172, 4.238349186000001, 4.565377537, "Cluster 0" ], [ "Bhutan", 2.655671226, 4.92248937, 5.589715842, 5.420760961, 5.060485995, 5.325051654, 4.849893798, 6.60698513, 3.749019455, 3.193554605, 4.166375755, 4.29057998, 5.118893938, 5.5624086660000005, 4.8912954719999995, 4.544794957, 4.142893462, 2.7008609310000002, 2.804824773, 2.6150396540000003, "Cluster 0" ], [ "Belarus", 4.793950729, 4.696646664, 5.427282394, 4.588919064, 4.7158020689999995, 4.626454599, 4.739935352, 4.560548727, 4.8657554869999995, 4.922950998, 5.022738287, 4.4504001230000005, 4.451424325, 3.871576451, 3.895442402, 4.3148055439999995, 3.472557647, 3.8657578999999997, 4.022291167, 3.7417552510000003, "Cluster 0" ], [ "Barbados", 3.541707878, 3.461739847, 3.3299528030000003, 3.1894177860000004, 3.277842886, 3.392050008, 3.6966440169999997, 3.962990388, 3.8432781069999997, 3.7180714760000004, 3.4632789969999997, 3.415845805, 3.7583009119999997, 4.056312343, 4.144961775, 4.009928747, 4.155989917, 4.841513416000001, 4.899894263, 4.744632219, "Cluster 0" ], [ "St. Lucia", 3.044466017, 3.540413289, 3.011746972, 3.0899609160000003, 3.0860480160000003, 2.8750947069999997, 3.2434443760000002, 3.2677446619999997, 2.943800165, 2.9480524710000005, 2.8950996630000003, 3.1148809789999996, 2.979865278, 3.573426446, 4.401846474, 4.034045185, 3.262981082, 4.207408698, 3.535976399, 3.599295246, "Cluster 0" ], [ "St. 
Vincent and the Grenadines", 3.78040306, 3.7626628060000002, 3.905015857, 3.379166091, 3.4596669789999996, 3.067373134, 2.950634745, 3.231535161, 3.2055298039999998, 3.022706918, 2.9590426830000003, 3.1835519619999997, 3.2201201989999997, 3.946405784, 4.33049775, 3.8582360810000003, 4.092983481, 4.403446842, 4.3086, 4.385223105, "Cluster 0" ], [ "Russian Federation", 3.962243165, 3.9654738039999997, 5.026415056, 4.308860664, 3.585441199, 3.2468243560000003, 3.328637239, 3.530756868, 3.298708379, 3.090936853, 3.2304787619999997, 3.35436078, 3.452891195, 3.520137222, 4.159022037, 3.696945486, 3.58245544, 3.795838898, 3.7073014489999996, 3.6909228080000003, "Cluster 0" ], [ "Suriname", 4.471885239, 3.145059885, 5.651223383, 7.115667758, 5.196504662, 5.6175626670000005, 4.184378634, 3.551353558, 3.3571448680000002, 3.3271645260000002, 3.469387753, 3.177793139, 2.9772981, 2.709678901, 3.196518003, 2.930358668, 2.921405525, 3.215861695, 3.202562051, 2.94062408, "Cluster 0" ], [ "Romania", 2.397777108, 2.353719196, 3.3087963410000003, 2.8352913060000002, 3.344160172, 3.5136997310000004, 3.534191634, 3.75783267, 4.4933842660000005, 4.0521396, 4.398723805, 4.030785785, 4.278891084, 4.374197997, 4.391968392, 4.68660531, 4.37807867, 4.397386285, 4.520294731, 4.47447755, "Cluster 0" ], [ "Estonia", 5.671494836, 5.809624371, 5.51790868, 4.797024971, 4.536437438, 4.075514834, 3.817487064, 3.735725858, 3.775009168, 3.8771176830000003, 3.850041558, 3.6735492119999997, 3.899242751, 4.712423412, 5.216716763, 4.9273468000000005, 4.625885477, 5.115761648, 5.138603368, 5.028395902, "Cluster 0" ], [ "Moldova", 5.815895061, 6.709797385, 6.075025236, 4.323722867, 2.901963967, 3.229712857, 3.2075372680000003, 4.040610039, 3.9671964969999998, 4.182380118999999, 4.176139383, 4.718684365, 4.9197080269999995, 5.389847747999999, 6.0594371979999995, 5.621478753, 5.311539911000001, 5.517522784, 5.031340165, 5.303988304, "Cluster 0" ], [ "Malawi", 1.865213739, 1.26338764, 1.600434006, 1.88109678, 
2.274782235, 2.7785565489999997, 2.215081497, 2.912550035, 4.578496658, 5.71696331, 6.066366509, 6.194908259, 4.41611059, 6.096624721, 6.185752937, 6.339254893, 6.933702546, 6.765934565, 5.793450792000001, 5.998620835, "Cluster 0" ], [ "Monaco", 2.7828046389999996, 2.722031577, 2.8387481, 2.760402313, 2.989907557, 2.8661872330000002, 2.911772468, 2.956788105, 3.466538501, 3.5451300519999998, 3.528936649, 3.360320254, 2.952654785, 3.1897775960000003, 3.8011578999999998, 3.896460373, 3.705257089, 3.764195008, 3.554960152, 3.841098459, "Cluster 0" ], [ "Macedonia, FYR", 4.996397418, 5.135953651, 5.5549962939999995, 6.489321372000001, 5.341639155, 4.787766545, 4.631112465, 5.191571141, 5.226034904, 5.039289244, 4.781614783999999, 4.87674973, 4.445867739, 4.7474917, 4.456857728999999, 4.292903636, 4.272932737, 4.42539678, 4.204269092, 4.1014206380000005, "Cluster 0" ], [ "Lithuania", 3.985217925, 3.931004202, 4.1614319669999995, 4.616115978, 4.64619213, 4.501929246, 4.5479188619999995, 4.792172072, 4.929875383, 3.83247282, 3.953664458, 4.3067158469999995, 4.542177272, 4.784195764, 5.485546619, 5.020955675, 4.739136876, 4.349539439, 4.312630815, 4.446889612, "Cluster 0" ], [ "Lebanon", 4.242476487, 4.991736717, 5.0616362619999995, 3.144910175, 2.943009427, 3.20634861, 3.733963909, 3.735593505, 3.496375815, 3.711970773, 3.7443329469999997, 3.631882475, 3.7155355410000004, 3.144813413, 3.123417148, 2.708551485, 2.7443969960000003, 3.235855284, 3.054229695, 3.043924599, "Cluster 0" ], [ "Latvia", 3.820164845, 3.525870433, 3.4596156560000004, 3.6262617789999996, 3.728657225, 3.2654466760000003, 3.1577079460000004, 3.2790679739999997, 3.2495228560000005, 3.684698103, 3.637151355, 4.357857145, 4.255979, 4.124515045, 4.070041625, 3.9402581469999998, 3.873401416, 3.576955393, 3.539843039, 3.7152319819999997, "Cluster 0" ], [ "Montenegro", 5.196505917, 5.196505919, 5.196505921, 5.1965059160000004, 5.196505922, 5.19650592, 5.9571847689999995, 5.880242121, 6.663011347, 
6.232366722999999, 6.022940018, 5.613499871, 4.5478217039999995, 3.9917967869999997, 3.61393065, 4.173469442, 4.186590285, 4.4723783919999995, 3.719088236, 3.66738093, "Cluster 0" ], [ "Mozambique", 3.3965561789999996, 2.598261241, 2.955873935, 2.9684768339999996, 3.5660974999999997, 4.311883073, 3.9675961089999996, 4.488862031, 4.108240978, 3.521927947, 4.306135066, 3.950981842, 3.1000050960000003, 2.606804503, 2.515159938, 3.0181028260000002, 2.6645777330000002, 2.776382768, 3.1190876260000002, 3.936734776, "Cluster 0" ], [ "Namibia", 4.413658721, 4.750908805, 4.924511725, 4.952596648, 5.111744353, 4.214029426000001, 3.474246902, 3.576968668, 3.722335405, 3.207038753, 3.579619723, 3.129120087, 3.800771171, 3.89854309, 4.417229575, 4.594429367, 5.315764413999999, 4.854097749, 5.029136422, 5.357137699, "Cluster 0" ], [ "Jordan", 5.328898363, 5.441182157, 5.116392745, 5.300589761, 4.991069703, 4.635309347, 4.786093096, 4.810691426, 4.451036994, 4.692325909, 4.761008321, 4.48990028, 4.994181963, 5.431250455, 6.6959843029999995, 5.921295616, 5.905862126000001, 5.5093025760000005, 4.873555443, 5.1931019460000005, "Cluster 0" ], [ "Israel", 4.950145432, 5.108144225, 5.144840787, 4.762189233, 4.6017821119999995, 4.460361462, 4.719172153, 4.737818754, 4.587586374, 4.473436246, 4.408425818, 4.702560226, 4.56088595, 4.471592985, 4.560773264, 4.6122764819999995, 4.618524658, 4.865016995, 4.857808386, 4.751695808, "Cluster 0" ], [ "Nicaragua", 4.1750942769999995, 3.7946175460000005, 2.577101237, 2.772020641, 2.433647188, 2.881102037, 2.8359501239999996, 2.995229948, 3.46223108, 3.389498166, 3.45056744, 3.473051685, 3.792404173, 3.830040753, 4.286697443, 4.288147231, 4.081974306, 4.260162572, 4.420152655, 5.095797672, "Cluster 0" ], [ "Hungary", 6.06578493, 5.707631445, 5.48077096, 5.293047243, 5.215692477, 4.992262794, 4.907747893, 5.241660919, 5.986829456000001, 5.625904986, 5.798315898999999, 5.651159262, 5.050828075, 4.9125672730000005, 4.958614911000001, 
5.117494816000001, 5.029887063, 4.910106031000001, 4.905828404, 4.8830819089999995, "Cluster 0" ], [ "Guyana", 4.1236919819999995, 4.042182563, 4.267222814, 4.314013546, 3.815805252, 4.954943485, 4.898010308, 4.94658054, 4.749728887, 4.548307265, 4.359658645, 3.044944275, 4.685796052, 5.5972460139999995, 5.30091141, 4.460583707, 4.57147769, 4.339437853, 2.896153441, 3.119698091, "Cluster 0" ], [ "Grenada", 3.0064343160000004, 3.0167429230000002, 3.157869167, 3.151488805, 3.7073192410000004, 3.4469993260000003, 4.513238797, 3.5245498769999997, 3.055066908, 2.7005638910000003, 2.918936395, 3.208181759, 2.897890968, 2.691541613, 3.073334628, 3.100526247, 3.040190628, 3.045941945, 2.7824442680000003, 2.827357413, "Cluster 0" ], [ "Panama", 5.246581756, 4.628785357, 4.875049583, 4.727189573, 4.543351694, 5.284626305, 5.179758628, 5.544147842, 5.046701513, 5.688574188, 5.205403273, 4.7207796019999995, 4.048878178, 4.666452338, 5.63276516, 5.6500218460000005, 5.08973241, 4.9715198019999995, 5.804010025, 5.878366088, "Cluster 0" ], [ "Papua New Guinea", 2.449537747, 2.585706214, 2.9792040010000003, 3.16658124, 3.373244226, 3.2561626969999997, 5.895055792999999, 6.716728432999999, 6.024920708, 7.601456272999999, 5.47058434, 5.05912292, 3.123843205, 3.0754131780000002, 3.2208812860000005, 3.1834109230000003, 4.041347222, 3.653279542, 3.906003811, 3.46554272, "Cluster 0" ], [ "Poland", 3.905037381, 4.224738069, 3.983748404, 3.828606974, 4.0329012760000005, 3.852713136, 4.210391357, 4.497808461, 4.349887106000001, 4.242001236, 4.298902044, 4.313210083, 4.4203601710000004, 4.935315917, 5.097181114, 4.902807428, 4.710355764, 4.577515541, 4.534424797, 4.507639603, "Cluster 0" ], [ "El Salvador", 2.456765433, 3.106327227, 3.204772995, 3.68357541, 3.6517329339999995, 3.796302763, 3.753448667, 3.8056802210000003, 3.750173665, 3.6353041960000003, 3.8125530939999996, 4.153138804, 3.7447696460000004, 3.706714781, 4.133696927, 4.29012069, 4.327903341, 4.2104711539999995, 4.632291908, 
4.4695083239999995, "Cluster 0" ], [ "Argentina", 4.966443086, 4.631641218, 4.553044297, 4.624211713999999, 5.152315686000001, 4.9658035819999995, 5.065933992, 4.4529400489999995, 4.251023183, 3.522396758, 3.6642338480000003, 3.654868936, 3.7830748410000004, 4.121097352, 5.040785799, 4.163482345, 3.745392503, 2.9589508739999997, 2.735022008, 2.652673798, "Cluster 0" ], [ "Seychelles", 4.22296599, 4.451643869, 4.820469327, 4.185799521, 4.236396955, 3.785614663, 3.758676506, 3.636458774, 4.145567132, 3.812610542, 3.620129416, 3.4579109889999997, 3.060728801, 2.405118358, 2.413078163, 3.2088597510000003, 3.1987716789999996, 3.797892539, 3.335699444, 3.107242732, "Cluster 0" ], [ "Swaziland", 2.832071581, 3.0579196060000005, 2.812078497, 2.879100714, 3.003066511, 2.9584121, 2.933657283, 3.0504573010000002, 3.719224901, 3.7224765680000003, 4.591988907, 4.559222042, 4.817315257, 5.70029508, 5.768594858999999, 5.9652663839999995, 5.971125925, 6.295393133999999, 7.374204077999999, 7.004909495, "Cluster 0" ], [ "Small states", 3.0834417839999997, 3.155744645, 3.18509596, 3.337760802, 3.2314720930000003, 3.053471183, 3.067515292, 3.2739580310000003, 3.46788155, 3.3720450910000004, 3.17828889, 2.9852425910000004, 2.963611867, 2.787731202, 3.320674555, 3.01892481, 2.816008951, 3.0011255610000003, 3.061103031, 2.9930888060000003, "Cluster 0" ], [ "Tonga", 2.670824514, 2.7968637689999998, 3.040161598, 3.2127216389999997, 3.763892167, 3.350358074, 4.284100434, 3.8079197839999996, 4.233041111, 4.050934622, 5.680380494, 4.879183916000001, 4.762818289, 4.186537045, 3.705109958, 3.6948683410000003, 3.223524387, 3.640530345, 4.0556243080000005, 4.265698947, "Cluster 0" ], [ "Vanuatu", 2.139305264, 1.749746805, 2.296830253, 3.038570387, 2.639952543, 2.73692934, 2.7885501360000005, 2.9076602460000003, 3.4189271389999996, 3.524656985, 3.292996247, 3.427445317, 3.161681536, 3.1798915739999996, 3.4023226980000003, 4.182597639, 3.3201783469999997, 3.167396258, 3.391475272, 4.510749546, 
"Cluster 0" ], [ "Pacific island small states", 4.0892714539999995, 3.644414077, 3.8171409, 3.801815827, 3.794036075, 4.478110937, 4.4304985530000005, 4.3275116780000005, 4.223171686000001, 4.262646193, 4.517164031, 4.531308472, 4.42810272, 4.253259024, 4.7700180130000005, 4.858082923, 4.239523762, 4.210439148, 4.497317273, 4.57632822, "Cluster 0" ], [ "Other small states", 3.116200718, 3.224322602, 3.2162667689999997, 3.450544585, 3.380267205, 3.0803314939999997, 3.1597630889999997, 3.3745049989999996, 3.6685363239999997, 3.488791995, 3.28108097, 3.027816988, 2.968221955, 2.75019805, 3.2710470039999997, 2.934337826, 2.74322401, 2.926310097, 2.99114702, 2.916463762, "Cluster 0" ], [ "Tunisia", 2.8943399860000003, 2.9873341, 2.6998275119999997, 2.9193048719999997, 2.898708402, 2.961609952, 2.834447949, 2.80141766, 2.833405347, 2.913685908, 2.866036298, 2.9550662180000002, 2.95239633, 3.041912298, 3.5073788560000003, 3.829212473, 4.167224012, 4.157872526, 4.229623294, 3.968816495, "Cluster 0" ], [ "East Asia & Pacific", 4.429089623, 4.203151524, 4.244351189, 4.4539837680000005, 4.626919635, 4.688849242, 4.684790174, 4.6135370689999995, 4.635098319, 4.626696416000001, 4.566215205, 4.367145726, 4.29739389, 4.43484819, 4.865241195, 4.7758171439999995, 4.871726678, 4.866869481, 4.643220952, 4.571447568, "Cluster 0" ], [ "Turkey", 1.76287716, 2.007166944, 2.244024053, 2.5846704, 2.913115705, 3.1142396469999998, 3.512553806, 3.786278215, 3.839653198, 3.826071088, 3.696382908, 3.971039668, 4.095218575, 4.435295202, 4.922531997, 4.412270438999999, 4.205859804, 4.1491432999999995, 4.225639909, 4.193778968999999, "Cluster 0" ], [ "Ukraine", 5.088198574, 4.78908302, 4.193678375, 3.540202425, 2.942150479, 2.895454814, 3.0721386930000003, 3.514016208, 4.042590061, 3.869747013, 3.811739442, 3.884569232, 3.9304539430000003, 3.825090501, 4.292353932, 4.421334806, 3.729821242, 4.12524044, 4.150794905, 3.6045211210000003, "Cluster 0" ], [ "Antigua and Barbuda", 2.746344563, 
2.505800464, 2.597402599, 2.6720647769999997, 2.744200045, 2.78780548, 2.949759953, 2.950231444, 2.950013005, 2.67979353, 2.950098595, 2.9501058739999997, 2.9499999960000003, 3.3430313860000003, 3.3438995960000004, 3.893547142, 3.8910395589999998, 3.652332634, 3.592597393, 3.7846106760000002, "Cluster 0" ], [ "Europe & Central Asia (IDA & IBRD countries)", 3.537976062, 3.612690525, 4.047882124, 3.552856873, 3.4807646410000004, 3.385148495, 3.605372687, 3.816964108, 3.794325476, 3.642164316, 3.6815884189999997, 3.721762687, 3.7981816160000004, 3.951117848, 4.401010223, 4.068056417, 3.818966004, 3.9016659039999997, 3.8579794, 3.846191068, "Cluster 0" ], [ "Latin America & the Caribbean (IDA & IBRD countries)", 2.956811011, 2.8777881119999997, 2.968040205, 3.004957842, 3.20538333, 3.0270711969999997, 3.1075857360000003, 2.9494428210000003, 2.962835975, 3.036156959, 3.0753731689999997, 3.0956160919999998, 3.153372508, 3.2389997839999998, 3.700609301, 3.5632974539999998, 3.5165400680000003, 3.452393518, 3.551660225, 3.7318080030000003, "Cluster 0" ], [ "Latin America & Caribbean (excluding high income)", 2.996164912, 2.9066398089999996, 3.008480229, 3.040838015, 3.2475128189999998, 3.059905096, 3.146714937, 2.9871068739999997, 3.037261298, 3.0705763210000003, 3.166319862, 3.1677693789999997, 3.2753891889999998, 3.337349586, 3.804703623, 3.638582097, 3.591022045, 3.496118138, 3.606970928, 3.7073110839999996, "Cluster 0" ], [ "Latin America & Caribbean", 2.984770895, 2.9017704010000003, 2.990421248, 3.029994934, 3.235733893, 3.0606926660000005, 3.144669013, 2.998687771, 3.012572927, 3.0775050760000005, 3.161939378, 3.1608411760000004, 3.255992195, 3.335194417, 3.8119949810000002, 3.6386887339999996, 3.592871857, 3.509236607, 3.6191427860000003, 3.73231283, "Cluster 0" ], [ "Europe & Central Asia (excluding high income)", 3.401579475, 3.4078958989999997, 4.035214654, 3.4127523760000003, 3.222938325, 3.1671554810000004, 3.357613026, 3.60566463, 3.621672658, 
3.4729823339999997, 3.506735617, 3.566116863, 3.6357801139999997, 3.735160497, 4.21818788, 3.878112626, 3.6528350869999997, 3.7801599689999996, 3.736001803, 3.714756912, "Cluster 0" ], [ "Thailand", 1.9694428380000002, 2.150730975, 2.536894078, 2.455703581, 2.314820676, 2.302887157, 2.292282152, 3.330872158, 3.467646858, 3.33413422, 3.3812775669999997, 3.904107096, 4.608862415, 4.7146609, 4.734495331000001, 4.441559229, 4.995567322, 5.237115011, 5.265840143999999, 5.615380522000001, "Cluster 0" ], [ "Uruguay", 3.880155497, 3.424728604, 2.61225038, 2.586152727, 2.918063853, 2.711547548, 2.314327052, 2.044716466, 1.7534277219999999, 7.293884084, 7.069810766, 7.2450250910000005, 4.593274899, 5.297812748999999, 5.352676888, 5.372432, 5.520950685, 5.947088677999999, 6.074635227999999, 6.111484304, "Cluster 0" ], [ "Central Europe and the Baltics", 4.678528481, 4.753208836000001, 4.604573867, 4.499987761, 4.679082306000001, 4.539710822, 4.6662723889999995, 4.900195789, 5.100249244, 4.913629428, 4.9708614110000005, 4.841450127, 4.80905668, 5.054785185, 5.3949206279999995, 5.284380429, 5.096212404, 5.041317268, 5.029265785, 5.017716676, "Cluster 0" ], [ "Algeria", 2.6735943559999997, 2.50218252, 2.553365736, 2.527980384, 2.383331292, 2.55856124, 2.97171746, 2.85227361, 2.802237023, 2.566248072, 2.280233074, 2.334850671, 2.7055707910000004, 3.0628038930000003, 3.83796598, 3.593208526, 3.7757293080000003, 4.52025089, 5.188359049, 5.24414553, "Cluster 0" ], [ "Andorra", 3.9826832960000003, 4.235647223, 4.297070495, 5.737580229, 3.9334656389999996, 3.976548227, 3.979763508, 4.109589041, 3.946179815, 3.91626014, 3.4597088489999996, 3.5661223730000002, 4.586322912, 4.825070819, 5.037537144, 6.242026697000001, 4.926289306, 5.747039877000001, 9.692356794, 6.341446004, "Cluster 0" ] ], "hovertemplate": "Cluster=%{customdata[21]}
Country Name=%{customdata[0]}
1995=%{customdata[1]}
1996=%{customdata[2]}
1997=%{customdata[3]}
1998=%{customdata[4]}
1999=%{customdata[5]}
2000=%{customdata[6]}
2001=%{customdata[7]}
2002=%{customdata[8]}
2003=%{customdata[9]}
2004=%{customdata[10]}
2005=%{customdata[11]}
2006=%{customdata[12]}
2007=%{customdata[13]}
2008=%{customdata[14]}
2009=%{customdata[15]}
2010=%{customdata[16]}
2011=%{customdata[17]}
2012=%{customdata[18]}
2013=%{customdata[19]}
2014=%{customdata[20]}", "legendgroup": "Cluster 0", "marker": { "color": "#636efa" }, "name": "Cluster 0", "notched": true, "offsetgroup": "Cluster 0", "showlegend": false, "type": "box", "x": [ "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0", "Cluster 0" ], "xaxis": "x2", "yaxis": "y2" }, { "alignmentgroup": "True", "bingroup": "x", "hovertemplate": "Cluster=%{x}
count=%{y}", "legendgroup": "Cluster 1", "marker": { "color": "#EF553B", "opacity": 0.7 }, "name": "Cluster 1", "offsetgroup": "Cluster 1", "orientation": "v", "showlegend": true, "type": "histogram", "x": [ "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1" ], "xaxis": "x", "yaxis": "y" }, { "alignmentgroup": "True", "customdata": [ [ "Micronesia, Fed. Sts.", 8.69618637, 8.135027023, 7.277088411, 6.4621381829999995, 7.064856562999999, 7.353309875, 8.006993747000001, 7.414073857999999, 9.029862856, 9.899822595, 11.3112, 11.03399209, 11.13554688, 11.6954023, 12.1732852, 12.61078232, 12.53821521, 11.58813926, 12.08993842, 12.43375207, "Cluster 1" ], [ "Kiribati", 8.96847138, 8.797772304, 8.982999914, 6.656954317, 8.444216993, 7.5829204820000005, 8.491803281000001, 8.563909775, 9.467625904, 9.892086335, 9.460431655, 9.359712228, 11.40077075, 10.31166521, 10.36476503, 8.725609752999999, 8.568862275, 8.313609463999999, 8.232914284, 8.291027024, "Cluster 1" ], [ "Finland", 5.627186976, 5.753535627000001, 5.563132051, 5.326593103, 5.268778053999999, 5.144464163, 5.343613088, 5.657160032, 5.932232517999999, 6.017266103, 6.2218654739999995, 6.27918843, 6.031731023, 6.253821942999999, 6.896822789, 6.73883183, 6.753551156, 7.040839875, 7.204016684, 7.289814272999999, "Cluster 1" ], [ "France", 8.058218715, 8.042808693, 7.944487318999999, 7.844248058, 7.831247747999999, 7.759499572999999, 7.848666574, 8.141653894, 8.127820878, 8.20640927, 8.266337172, 
8.173183403, 8.118287794, 8.16933746, 8.74652319, 8.679104958, 8.731135953999999, 8.826051795, 8.910694046, 9.024514376, "Cluster 1" ], [ "United Kingdom", 5.613873295, 5.574901951, 5.216401283, 5.273439395, 5.503507084, 5.523467366, 5.765949885, 6.040016206000001, 6.209568, 6.482429976000001, 6.658344919, 6.826598411, 6.794481096, 7.220152923, 8.162898056, 7.94167603, 7.765411293, 7.80263316, 7.780480937999999, 7.578850169, "Cluster 1" ], [ "Germany", 7.678673477, 8.117369547000001, 8.08569888, 8.040406659, 8.012330015, 7.9987526429999996, 8.03376379, 8.181587749, 8.289385968, 7.9198192579999995, 8.006701839, 7.85851875, 7.7325195110000005, 7.9017386620000005, 8.709862289, 8.575730796, 8.307622306, 8.361114536, 8.569493975, 8.697237324, "Cluster 1" ], [ "Malta", 3.819517745, 4.105345357, 4.384384401, 4.443696789, 4.393656255, 4.742394807, 4.8342677489999994, 5.429400948, 5.542024248, 5.653685894, 5.997448889, 6.0463126979999995, 5.482240553, 5.156232157, 5.2500287619999995, 5.219545076, 6.462012081, 6.6252345660000005, 6.554282826000001, 6.74343039, "Cluster 1" ], [ "Greece", 4.301359499, 4.325647391, 4.232330999999999, 4.1185477530000005, 4.34042636, 4.5622111, 5.146070341000001, 5.055646368000001, 5.14686853, 4.90873744, 5.627319096, 5.790832345, 5.677828365, 5.84985855, 6.781079862, 6.2163537479999995, 6.682802397000001, 6.274430226000001, 6.066287526, 4.985039193, "Cluster 1" ], [ "Portugal", 4.645839437, 5.024970483, 5.049986861, 5.117457254, 5.3179309130000005, 6.193279482, 6.233144247999999, 6.4624051929999995, 6.564295702000001, 6.8934000829999995, 6.989928936, 6.5834602, 6.506712635, 6.674037277, 7.160521451, 7.171492441, 6.70065608, 6.238911387000001, 6.2321554379999995, 6.158189113, "Cluster 1" ], [ "Austria", 7.137100143, 7.096256981, 7.356728587999999, 7.478719544, 7.648251788, 7.536366526, 7.503314227000001, 7.606508347999999, 7.736479762, 7.791336459, 7.83141883, 7.737932786, 7.775802592000001, 7.995856889, 8.466129609, 8.400006947, 
8.213674722999999, 8.417189562, 8.370613437000001, 8.72502572, "Cluster 1" ], [ "European Union", 6.506458015, 6.584349032, 6.447821826, 6.395838336000001, 6.453924272, 6.4399001160000005, 6.570972316000001, 6.747120362, 6.899522022999999, 6.9109638470000005, 7.051118847000001, 7.087790266, 7.002368177999999, 7.256592777000001, 7.936430028999999, 7.820468929, 7.744258462, 7.79306822, 7.8369536570000005, 7.818446175, "Cluster 1" ], [ "Japan", 5.451500805, 5.342586047, 5.469916116, 5.652911799, 5.909097683, 6.087614007000001, 6.297406178999999, 6.361552576, 6.420410051, 6.47273952, 6.657459568999999, 6.596439242000001, 6.715044868, 6.995021791, 7.753493212, 7.861969364, 8.318249839, 8.409920777, 8.528219096, 8.550081685, "Cluster 1" ], [ "Australia", 4.775232585, 4.856308024, 5.016476282, 5.084647809, 5.326927409, 5.399511666, 5.42099866, 5.620660145, 5.50612734, 5.724898888999999, 5.661448484, 5.660886591000001, 5.765876395, 5.927631008, 6.186556011, 6.127334253, 6.315378278, 6.285633269, 6.274917138999999, 6.316592657999999, "Cluster 1" ], [ "Norway", 6.499858794, 6.45280883, 6.697116683, 7.454887071, 7.547604056, 6.82382819, 7.22396035, 8.027209665, 8.247464055, 7.888860771, 7.430282026, 7.062887755, 7.219227008, 7.091172877000001, 8.021737678, 7.839228687, 7.717230788999999, 7.773855997999999, 8.005414287, 8.309618200000001, "Cluster 1" ], [ "Netherlands", 5.286854099999999, 4.9482342180000005, 5.071556448, 4.849467046, 4.722084285, 4.682621338, 4.89473375, 5.2119207030000005, 5.627419176, 5.591158703, 6.668937025, 7.974464533, 7.980489499, 8.209741428, 8.901516849, 9.081296075, 9.085857928, 9.528421586, 9.617134752, 9.481132729, "Cluster 1" ], [ "United States", 5.9094787879999995, 5.891274291, 5.830750135, 5.676669198, 5.613684996, 5.653471017999999, 6.074098006, 6.423940796, 6.618867537000001, 6.69810039, 6.722608977999999, 6.882532539, 7.01636006, 7.367883673, 8.014549675, 8.079784435, 8.07412666, 8.042357809, 8.045006773999999, 8.278517711000001, "Cluster 1" 
], [ "Iceland", 6.88713759, 6.797412968, 6.493117315, 7.037368982, 7.77504317, 7.5449804160000005, 7.405369028, 8.074375998999999, 8.231289339, 7.794296374, 7.499485021, 7.349510337999999, 7.225443543, 7.2743097820000004, 7.479480519, 7.116064072, 6.972243353, 6.994047937, 7.067580829, 7.179705939, "Cluster 1" ], [ "Italy", 5.020894767, 5.084493833, 5.286288745, 5.300234371, 5.384669776, 5.704658031, 5.973164167999999, 6.07690275, 6.07045375, 6.414766985, 6.644147576, 6.7435972920000005, 6.487839661000001, 6.836653592999999, 7.248665862999999, 7.256673496, 6.969185175, 6.993120899, 6.967351379, 6.992651033, "Cluster 1" ], [ "High income", 5.8528186589999995, 5.861951134, 5.81180873, 5.837542174, 5.859037054, 5.853669228999999, 6.131478777000001, 6.354331656, 6.509857349, 6.545027623999999, 6.604202186, 6.657364768, 6.685402534, 6.945781465, 7.638854311, 7.562423022000001, 7.546564171, 7.556054525, 7.573148687000001, 7.6586505670000005, "Cluster 1" ], [ "New Zealand", 5.362051931, 5.283706171, 5.486240926, 5.787903257000001, 5.731562231, 5.827839126000001, 5.791984927000001, 6.146520495, 6.041511196, 6.281577112999999, 6.572475187, 6.922995765, 6.883399708, 8.906984606, 9.323010285, 9.305461872999999, 9.342877083, 9.547666612999999, 9.226556936, 9.082656345, "Cluster 1" ], [ "Palau", 8.650190111, 8.769106997, 8.390541575, 7.07424594, 7.624323455, 6.370625003, 6.1851190460000005, 5.948520708999999, 6.0942528739999995, 6.490673575, 5.895631066, 6.342105263, 6.559764147999999, 6.540845072000001, 6.614646467999999, 7.641116751, 6.548387094, 6.739224139, 6.599186992000001, 6.531970262000001, "Cluster 1" ], [ "World", 5.286303621, 5.246769791, 5.19680285, 5.227929882, 5.2749122989999995, 5.2211192539999995, 5.444044382, 5.633904668, 5.765420482000001, 5.755465472000001, 5.733553112999999, 5.701873011, 5.65229917, 5.78265714, 6.32094847, 6.075446192999999, 5.982564844, 5.940788187000001, 5.921679595, 5.994028234, "Cluster 1" ], [ "Sweden", 6.901266869, 7.1283580970000004, 
6.888226931, 6.962480445, 7.027549767000001, 6.943698089, 7.188240259, 7.513944417, 7.634858717999999, 7.3951965379999995, 7.354150307, 7.259516112999999, 7.254788683999999, 7.521564636, 8.100547687, 7.7183103289999995, 9.914691787999999, 9.955521086000001, 10.05201524, 10.02469431, "Cluster 1" ], [ "Cuba", 4.648496225, 4.756708361, 4.986951137, 5.226020532, 5.474999382999999, 5.509533717, 5.670491082000001, 5.724849955, 5.648789044, 5.468185582, 8.744448247000001, 7.081250077999999, 9.883198101, 10.29335824, 11.28391889, 9.70382827, 10.07101019, 8.088255377000001, 8.962294541, 10.57366249, "Cluster 1" ], [ "Switzerland", 4.999426018, 5.292310568, 5.3136251660000005, 5.381639812, 5.51555988, 5.492175839, 5.852946307000001, 6.123779435, 6.379751456, 6.4003113570000005, 6.459405675, 6.141737847999999, 6.032418431, 6.703738631, 7.209714872999999, 7.09727006, 7.2009273579999995, 7.498784843999999, 7.733805564, 7.695117355, "Cluster 1" ], [ "Slovak Republic", 5.367669133, 5.708260171, 5.302839859, 5.179371767, 5.157902597, 4.915242275, 4.914849534, 5.013706746, 5.138875209, 5.319742082, 5.241058358, 5.020215772, 5.184301959, 5.4353000510000005, 6.012034516, 5.797130372000001, 5.643904536, 5.679221056, 5.7880822, 5.8395992020000005, "Cluster 1" ], [ "Post-demographic dividend", 5.923737902999999, 5.937932599, 5.892328742999999, 5.914243707000001, 5.932601223, 5.939920697000001, 6.2178511610000005, 6.445490047000001, 6.611676409, 6.657098828, 6.744363002999999, 6.812281987, 6.853256687000001, 7.145683267000001, 7.822250526, 7.781963316000001, 7.795102793, 7.812069609, 7.833116298999999, 7.914720128, "Cluster 1" ], [ "Serbia", 4.267816797, 4.267816799999999, 4.267816797, 4.2678168030000005, 4.267816797, 4.267816797, 4.600455039, 5.837583112999999, 5.766948594, 5.672611076, 5.742701002, 5.664904303999999, 6.146621793, 6.228211971, 6.12657588, 6.241991647000001, 6.039682906, 6.049713243999999, 5.984362308, 6.416505605, "Cluster 1" ], [ "Spain", 5.3735065539999995, 
5.400270122999999, 5.314511603, 5.284405916, 5.269708002, 5.16745964, 5.155738488, 5.168936096, 5.727875546, 5.79793601, 5.875803104, 6.0053206370000005, 6.098790144, 6.512856144, 7.209759954, 7.173242115, 7.001061132, 6.734615203, 6.502610209, 6.399991901, "Cluster 1" ], [ "Lesotho", 3.562259305, 3.780533582, 3.117609003, 3.272044207, 3.239233383, 3.4740210489999996, 4.372510108, 3.831319315, 4.034880661, 3.938291734, 3.309584005, 4.175710594, 5.597512217, 6.059683765, 7.000413737000001, 8.079925072, 9.087435867, 8.447350944, 8.408564819, 8.082167603, "Cluster 1" ], [ "Europe & Central Asia", 6.258717592999999, 6.339840985, 6.249748329, 6.19495497, 6.269452692000001, 6.207590774, 6.357420652, 6.543767225, 6.68023106, 6.643569576, 6.70922848, 6.691295997, 6.590409565, 6.775062286, 7.489585233, 7.256678468, 7.09676356, 7.10705862, 7.143518692000001, 7.184029645, "Cluster 1" ], [ "Maldives", 3.662613659, 3.603093758, 3.54408858, 4.648466888, 4.74957875, 5.119448212, 3.7002680060000004, 3.567182597, 3.778200959, 3.8768776689999997, 7.126649771, 5.237830448, 4.553267366, 7.025877902, 6.729711552, 5.273435237, 5.608781865, 6.50292714, 8.263833455, 10.75705209, "Cluster 1" ], [ "Costa Rica", 4.9819644169999995, 5.065507246, 4.838992757, 5.6371740610000005, 5.362922535, 5.61242476, 5.485507511000001, 6.2834759920000005, 6.450275287, 5.653259257, 5.4657120589999995, 5.397313924, 5.627837325, 6.261310673, 7.022189965, 7.092617051, 7.149714006, 7.000226946000001, 6.914441165, 6.76760152, "Cluster 1" ], [ "Canada", 6.3135005, 6.112419052999999, 6.033111823, 6.228970762, 6.107698328, 6.098426758, 6.3649046810000005, 6.514305746000001, 6.694243642999999, 6.719901986, 6.723559526, 6.788407822999999, 6.893501359, 7.063453852, 7.914158212, 7.88439634, 7.676792501, 7.651144554, 7.575664927999999, 7.4119318839999995, "Cluster 1" ], [ "OECD members", 5.837047317000001, 5.841498345, 5.7873592060000005, 5.793233257000001, 5.816090555, 5.809017258, 6.0848777929999995, 6.308109241, 
6.476244914, 6.522930721, 6.584750763, 6.646100419, 6.68397179, 6.97570711, 7.653295827000001, 7.58452343, 7.588942977, 7.608825853, 7.617928345, 7.692358487999999, "Cluster 1" ], [ "Croatia", 5.8306697629999995, 6.135021776, 4.893760696, 5.7330917679999995, 6.326324594, 6.6022750629999996, 5.96435491, 4.955064171, 5.242817131, 5.314158705, 5.930617257000001, 5.984641875, 6.477622756000001, 6.538722947999999, 7.006867431, 7.064964214, 6.25541215, 6.363207061000001, 6.403028794, 6.388287591, "Cluster 1" ], [ "Ireland", 4.669802976000001, 4.541905478, 4.6448398619999995, 4.494538697, 4.461866317, 4.466601084, 4.911672749, 5.1711671, 5.402683783, 5.5962288860000005, 5.520724187999999, 5.443878625, 5.729910174, 6.513027123, 6.917241581, 6.101439901, 5.5260434620000005, 5.622416984, 5.333288818, 5.141484076, "Cluster 1" ], [ "North America", 5.9389948960000005, 5.907198654, 5.845014468, 5.71256593, 5.645996433, 5.683423459, 6.092951705, 6.429777137, 6.624290735, 6.699777867000001, 6.722686909, 6.874371534, 7.005070493, 7.338893627999999, 8.005831942999999, 8.060768597000001, 8.033060722, 8.002663479, 7.998392667, 8.197720774, "Cluster 1" ], [ "Czech Republic", 6.084042522000001, 5.812945806, 5.779225055, 5.803851213, 5.744610454, 5.702534921, 5.7649027539999995, 6.149834668, 6.404474042, 6.15449697, 6.054044375, 5.805408814, 5.556626261, 5.628784423, 6.5696540279999995, 6.22493667, 6.314732469, 6.341764994, 6.313087853, 6.264976383, "Cluster 1" ], [ "Denmark", 6.7053440470000005, 6.76753736, 6.706312228, 6.694654162000001, 7.517019335, 7.29518541, 7.660538886, 7.885050087000001, 8.039900364, 8.152818891, 8.253254964, 8.399549167, 8.429011642999999, 8.621214821, 9.756125393, 9.433817543, 9.26885262, 9.419660272, 9.593210322000001, 9.158734109, "Cluster 1" ], [ "Euro area", 6.716641592, 6.819911767000001, 6.775234333999999, 6.713451942000001, 6.707802202000001, 6.725721019, 6.824762086000001, 6.9704907160000005, 7.100569779, 7.08237852, 7.243410635, 7.2751367270000005, 
7.183725909, 7.419702701, 8.060334166, 7.985294914, 7.851059524, 7.904805463, 7.961558065, 8.001479856, "Cluster 1" ], [ "Belgium", 5.845320714, 6.184037715, 5.853458122999999, 5.899438234, 6.023602106, 6.058374214, 6.2528146289999995, 6.24450897, 6.9180965510000005, 7.127857092999999, 7.112748229, 6.962370453999999, 6.952936769, 7.396754446, 8.043822364, 7.896702726, 8.006737375, 8.186298971, 8.226719108, 8.249989468999999, "Cluster 1" ], [ "Slovenia", 5.792909005, 5.819026492000001, 5.819143855, 5.897932514, 5.900414841, 6.116332806, 6.280502195, 6.32476385, 6.314120889, 6.221904529, 6.212733312999999, 6.122382991, 5.773929573999999, 6.291263917999999, 6.9246336820000005, 6.72862594, 6.673550483, 6.803887187000001, 6.668260437000001, 6.623821787000001, "Cluster 1" ], [ "Bosnia and Herzegovina", 3.3504531589999997, 4.802890013, 3.4999255760000003, 3.329547245, 4.7307526289999995, 4.032095716000001, 4.312505733, 4.422546498, 5.478547872, 5.173272164, 4.865928659, 4.979969839, 5.334221943, 5.812860562000001, 6.803551255, 6.788921332, 6.923006484, 7.080212274, 6.629772276000001, 6.813077082, "Cluster 1" ], [ "Luxembourg", 5.145716534, 5.245560163, 5.173766337, 5.237903806, 5.232189737, 6.361267183, 6.236389009, 7.070858488, 6.457623507, 6.958297657999999, 6.747706438, 6.597379851, 5.82007398, 6.492969779, 7.025644269, 6.594701877, 6.26066183, 5.988070914, 5.9392373229999995, 5.822836062, "Cluster 1" ] ], "hovertemplate": "Cluster=%{customdata[21]}
Country Name=%{customdata[0]}
1995=%{customdata[1]}
1996=%{customdata[2]}
1997=%{customdata[3]}
1998=%{customdata[4]}
1999=%{customdata[5]}
2000=%{customdata[6]}
2001=%{customdata[7]}
2002=%{customdata[8]}
2003=%{customdata[9]}
2004=%{customdata[10]}
2005=%{customdata[11]}
2006=%{customdata[12]}
2007=%{customdata[13]}
2008=%{customdata[14]}
2009=%{customdata[15]}
2010=%{customdata[16]}
2011=%{customdata[17]}
2012=%{customdata[18]}
2013=%{customdata[19]}
2014=%{customdata[20]}", "legendgroup": "Cluster 1", "marker": { "color": "#EF553B" }, "name": "Cluster 1", "notched": true, "offsetgroup": "Cluster 1", "showlegend": false, "type": "box", "x": [ "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1", "Cluster 1" ], "xaxis": "x2", "yaxis": "y2" }, { "alignmentgroup": "True", "bingroup": "x", "hovertemplate": "Cluster=%{x}
count=%{y}", "legendgroup": "Cluster 2", "marker": { "color": "#00cc96", "opacity": 0.7 }, "name": "Cluster 2", "offsetgroup": "Cluster 2", "orientation": "v", "showlegend": true, "type": "histogram", "x": [ "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2" ], "xaxis": "x", "yaxis": "y" }, { "alignmentgroup": "True", "customdata": [ [ "Vietnam", 1.757862744, 1.632231732, 1.604611275, 1.731437579, 1.717060034, 1.513863444, 1.627560706, 1.447735609, 1.551822426, 1.393649581, 1.4195695640000001, 1.94486753, 2.563552268, 2.1319632019999997, 2.5691874219999997, 2.9609666289999996, 2.805001867, 3.722124141, 3.796360562, 
3.820019105, "Cluster 2" ], [ "Morocco", 1.184133718, 1.14335155, 1.073390243, 1.179102117, 1.149141903, 1.229737845, 1.427759227, 1.378808948, 1.39499543, 1.4295298019999998, 1.4389258669999998, 1.7144025040000002, 1.8980773180000001, 1.891971766, 2.046396065, 2.0675720369999997, 2.08777206, 2.181466365, 1.95774948, 2.001326276, "Cluster 2" ], [ "Nepal", 1.407378795, 1.42214041, 1.4710270630000002, 2.554396091, 1.763231864, 1.352123349, 1.5944633019999999, 1.640840974, 1.527687611, 1.590326576, 1.585328429, 2.044874971, 2.2831250830000003, 2.725698705, 2.824395263, 2.867317073, 3.24209748, 2.466854595, 2.2199025619999997, 2.337819114, "Cluster 2" ], [ "Myanmar", 0.40560317, 0.33454759, 0.262807177, 0.16829349300000002, 0.170964179, 0.26099717100000003, 0.224982015, 0.313588382, 0.243334548, 0.266961522, 0.164974085, 0.256312052, 0.19819528600000003, 0.207554701, 0.232553662, 0.299251928, 0.297624635, 0.819629102, 0.826846155, 1.0448998040000002, "Cluster 2" ], [ "Venezuela, RB", 1.803152127, 1.482414909, 1.3873164880000002, 1.466015602, 1.83342208, 2.163059483, 2.3407567019999997, 2.1513320019999997, 2.079300496, 2.158140627, 2.153332428, 2.221770123, 2.4647812030000003, 1.230489115, 2.496312442, 2.088239278, 2.33545129, 1.675638027, 1.5428590880000002, 1.5427659459999998, "Cluster 2" ], [ "Mongolia", 2.598917911, 3.0338893369999997, 3.06342556, 3.4813274830000003, 3.417399945, 3.828286275, 3.89985284, 3.455279064, 2.918031289, 2.92676436, 2.484591225, 2.3969135919999998, 2.736412235, 3.18351906, 2.768372713, 2.654478067, 2.595706257, 2.260514895, 2.21159453, 2.620572882, "Cluster 2" ], [ "Uzbekistan", 3.6000000030000003, 3.7000000010000003, 3.300000002, 2.9445866919999997, 2.804581287, 2.5156908159999998, 2.5501141069999997, 2.424055326, 2.3806037019999997, 2.26249735, 2.279013274, 2.4548033890000003, 2.298687476, 2.529900054, 2.619290185, 2.7513171560000003, 2.863900619, 3.1273714530000003, 3.117906257, 3.11124825, "Cluster 2" ], [ "United Arab Emirates", 
2.0817381580000003, 1.948805565, 1.9483958190000001, 2.056706777, 1.9176294719999998, 1.6770585919999998, 1.944492099, 1.7139829819999999, 1.67154037, 1.45604253, 1.36889725, 1.3825069509999999, 1.5553772380000002, 1.9216341030000001, 3.0341259469999997, 2.834165586, 2.732488042, 2.550025889, 2.557326087, 2.636151579, "Cluster 2" ], [ "Nigeria", 0.658145013, 0.6004809210000001, 0.717612288, 0.9066261859999999, 0.9836661459999999, 0.949286025, 1.0177073509999999, 0.622004345, 0.9066617840000001, 1.4147604390000001, 1.19778681, 1.204600858, 1.472728808, 1.470059403, 1.324670016, 0.908580697, 1.151611248, 1.033169532, 0.8826272559999999, 0.9225351270000001, "Cluster 2" ], [ "Sudan", 0.785822105, 1.1132446329999999, 0.8913511359999999, 0.947423065, 0.7634364029999999, 0.887398963, 0.755115843, 0.7832779759999999, 0.883215533, 1.080722762, 1.091364, 1.270562706, 1.511842397, 2.630955513, 2.356734868, 2.698468913, 2.557343508, 1.8717955609999999, 1.859793759, 1.802361864, "Cluster 2" ], [ "St. 
Kitts and Nevis", 3.210272875, 3.167420812, 2.96495957, 3.0322580639999996, 3.038774765, 2.572590516, 2.262442891, 2.091861802, 2.087233898, 1.8705093169999998, 1.9221866930000002, 2.336683006, 2.154610635, 2.030668845, 2.193108956, 2.532022242, 2.26067011, 2.375174636, 2.183728661, 2.144605023, "Cluster 2" ], [ "Sri Lanka", 1.615371713, 1.611450175, 1.520769471, 1.878021898, 1.7467114680000002, 1.846321629, 1.7582096980000002, 1.6833360119999998, 1.677615192, 2.005508786, 1.85010327, 1.950059208, 1.825976447, 1.5815241269999998, 1.53517067, 1.5538039369999999, 1.38092651, 1.219599412, 2.102564149, 1.96395333, "Cluster 2" ], [ "Syrian Arab Republic", 2.189237706, 1.9540946959999999, 1.8777604769999998, 1.960923229, 2.01442573, 1.989779169, 2.173051471, 2.262242934, 2.4683381680000003, 2.148408978, 2.075568445, 1.833546841, 1.7896512969999998, 1.5964767030000002, 1.631376352, 1.507165795, 1.507165794, 1.507165792, 1.507165795, 1.507165795, "Cluster 2" ], [ "Tajikistan", 1.289444392, 1.296720852, 1.601227323, 1.141229192, 1.040832288, 0.946474655, 0.9497662490000001, 0.9065827479999999, 0.910560376, 0.94333442, 1.1438192790000001, 1.129053783, 1.184751796, 1.371774183, 1.478536975, 1.594683309, 1.71027997, 1.87760452, 2.067731786, 1.983765009, "Cluster 2" ], [ "Tanzania", 1.3671389859999998, 1.174080484, 1.127228367, 1.009735219, 1.1200299009999999, 1.1459393759999998, 1.769595394, 2.106622222, 2.573524874, 2.565945049, 2.965165865, 4.763505728, 3.038471158, 2.435878095, 2.109638156, 2.072897335, 2.4866151380000003, 2.790460229, 2.565408087, 2.589958711, "Cluster 2" ], [ "Togo", 1.5142425659999998, 1.476366118, 1.263694426, 1.5228179240000002, 1.4206208740000001, 1.420842968, 1.25272483, 0.906148993, 1.441999812, 1.6843732040000001, 1.898455965, 2.2596331419999998, 2.157573571, 2.416491795, 3.2782154439999998, 1.9385851369999998, 1.655337459, 1.947797344, 2.148307048, 2.01732113, "Cluster 2" ], [ "Singapore", 1.456150914, 1.391903127, 1.344772866, 1.66411043, 
1.4782905990000001, 1.217784989, 0.887039769, 1.0589667740000002, 1.346161446, 1.030256162, 1.003758123, 1.0010905540000001, 0.955389862, 1.20049011, 1.526597419, 1.3714286169999998, 1.346479037, 1.501077737, 1.735920655, 2.054683314, "Cluster 2" ], [ "Sierra Leone", 2.388388089, 2.163428251, 2.513163766, 2.0471494480000003, 3.064624564, 3.49413205, 2.824141502, 2.9649160219999997, 2.784261175, 2.683917256, 2.676174105, 1.961695331, 1.645375923, 1.7879205000000002, 2.2075173169999998, 2.396940634, 2.646933502, 1.980878492, 1.6946554809999999, 1.8838018559999998, "Cluster 2" ], [ "Mexico", 2.130169342, 1.9017575580000001, 2.108606157, 2.209776657, 2.3947401530000003, 2.318107511, 2.39862085, 2.4220273480000003, 2.541277434, 2.688003906, 2.618877856, 2.560345155, 2.6423747680000003, 2.7609368169999997, 3.095935571, 3.103295671, 3.067131298, 3.160971159, 3.2569934060000003, 3.2595515739999996, "Cluster 2" ], [ "Niger", 1.46894782, 1.28448572, 1.6847956030000002, 1.6945951419999998, 1.6988028130000001, 1.5224654819999999, 1.8667212, 1.909258365, 1.6804503130000001, 1.845863957, 2.978654315, 3.175497048, 2.662864682, 2.6958767939999997, 2.650386504, 2.162436939, 2.453245216, 2.211834697, 2.455677176, 3.214493821, "Cluster 2" ], [ "Senegal", 1.2798538309999998, 1.4840143330000002, 1.2842599890000002, 1.311168581, 1.741001217, 1.8955416319999998, 2.135240269, 1.95048094, 2.09132832, 2.1192570930000003, 2.9824374189999996, 3.149901608, 2.3325124280000002, 2.52752637, 2.486263648, 2.368547813, 2.2798394, 2.179866218, 2.238315424, 2.41795607, "Cluster 2" ], [ "Trinidad and Tobago", 2.638269986, 2.386765057, 2.344393146, 1.952658896, 2.344861306, 1.9555948980000002, 2.226981196, 2.647006573, 2.599973229, 2.599777231, 2.641981687, 2.2319773019999998, 2.37526743, 2.164450301, 3.2808106789999996, 3.018338697, 2.680151372, 2.894988852, 3.144494274, 3.174627521, "Cluster 2" ], [ "Rwanda", 1.639887766, 1.875693261, 1.8534048269999999, 2.558416099, 2.083504954, 1.65315324, 
2.138891489, 2.182617409, 3.345043303, 2.875959967, 3.1994948919999997, 4.98059157, 3.780193618, 2.8301189489999996, 2.402053946, 2.928013553, 2.810805898, 2.835877205, 2.9251774489999995, 2.86940115, "Cluster 2" ], [ "Turkmenistan", 1.8558282190000002, 2.261439427, 3.479223681, 3.501250448, 2.385819704, 3.214627605, 2.817917069, 2.43147657, 2.708526219, 2.4214305080000003, 2.021050273, 1.5455485169999998, 1.388148149, 0.946836468, 1.163073225, 1.223637874, 1.268097271, 1.273376388, 1.4260022369999998, 1.348530564, "Cluster 2" ], [ "Uganda", 1.419934953, 1.4132376530000001, 1.434781572, 1.895182926, 1.6585483509999999, 1.837958926, 1.9800486640000001, 2.105321926, 1.948108485, 2.265551769, 2.36197808, 2.472357111, 2.461809429, 2.302819536, 1.814334366, 3.118358422, 2.633267177, 2.15389932, 2.087896717, 1.801251317, "Cluster 2" ], [ "Qatar", 2.3204105040000003, 2.494258485, 2.14754465, 2.26219926, 1.9516241730000001, 1.574730065, 1.9219924780000002, 2.035923049, 3.488087043, 3.0369040139999997, 2.535151656, 2.172082184, 1.9433211680000002, 1.574182634, 2.065527913, 1.6208308630000001, 1.5059314080000001, 1.8314776730000002, 1.85480107, 1.87539141, "Cluster 2" ], [ "Philippines", 1.363656828, 1.451424131, 1.558107718, 1.373206902, 1.428355789, 1.526761368, 1.3244430759999999, 1.116642339, 1.306200566, 1.3031314390000002, 1.5016485869999998, 1.452187111, 1.367826516, 1.332745624, 1.54867658, 1.57369151, 1.306362975, 1.386256358, 1.449217044, 1.614685219, "Cluster 2" ], [ "Peru", 2.4000535530000002, 2.439421903, 2.266327886, 2.571913148, 2.829916303, 2.720831514, 2.83143959, 2.825705616, 2.690862148, 2.543761347, 2.69389613, 2.392145848, 2.414623092, 2.452033774, 2.983444427, 2.794287232, 2.624140306, 2.846647646, 3.0451036680000003, 3.31875118, "Cluster 2" ], [ "Paraguay", 2.1300236740000003, 2.395655422, 2.428081297, 2.821045288, 3.030939089, 3.2306281489999997, 2.654111955, 2.16010372, 1.94949197, 2.031570671, 2.355197356, 2.610014991, 2.6921865680000003, 
2.713075726, 3.498680631, 3.360902763, 3.765919165, 4.598601243, 4.781259119, 4.502240378, "Cluster 2" ], [ "Pakistan", 0.655509247, 0.7153439309999999, 0.6555669679999999, 0.5714069, 0.55473074, 0.608602423, 0.551524181, 0.80938608, 0.648320921, 0.677300991, 0.6859182840000001, 0.7887748040000001, 0.7988322409999999, 0.839235884, 0.802903527, 0.954234466, 0.919768299, 1.0184630190000001, 0.994330811, 0.9188114740000001, "Cluster 2" ], [ "Oman", 3.060043613, 2.984456681, 2.782569753, 3.0185177010000004, 2.8937463589999997, 2.51203413, 2.528963608, 2.654750721, 2.629465786, 2.437561733, 2.130347883, 1.8645977580000002, 1.968289323, 1.586300815, 2.3007373269999998, 2.269729033, 2.039566518, 2.079956768, 2.4085738130000003, 3.190228575, "Cluster 2" ], [ "Saudi Arabia", 1.5431946069999998, 1.617271884, 1.7527047119999999, 1.945860041, 2.8033962839999997, 3.051834468, 3.25646885, 3.090089872, 2.89642297, 2.561828615, 2.4783645, 2.641391252, 2.5073977469999997, 1.8894052119999998, 2.788237062, 2.2652001090000002, 2.495887158, 2.7522826960000004, 3.1003695560000004, 3.4907897410000004, "Cluster 2" ], [ "Mauritius", 1.9791546869999999, 1.904916232, 1.91146883, 1.954499964, 1.8827777280000002, 1.96954971, 2.004170598, 2.180551666, 2.1883490930000002, 2.349088838, 2.214836795, 2.047507497, 1.872909835, 1.782954216, 2.168691339, 2.5825881280000003, 2.46122411, 2.292702791, 2.3655561919999997, 2.364685746, "Cluster 2" ], [ "Arab World", 2.004867785, 2.0146024280000003, 2.071308732, 2.177711645, 2.331000345, 2.3335961, 2.58875078, 2.54023836, 2.450414915, 2.314914077, 2.134281009, 2.133037666, 2.16687238, 2.101232726, 2.830066845, 2.4896314569999998, 2.539570311, 2.7112619789999997, 2.895427378, 3.0731609939999998, "Cluster 2" ], [ "Chad", 2.011375251, 1.960913759, 1.963588748, 1.659397007, 1.9898415530000002, 2.66748418, 2.396482425, 2.691863992, 2.268320284, 2.299355155, 1.55797137, 1.128978799, 1.2502512209999999, 0.996604191, 1.231522791, 1.185137165, 1.534874565, 
1.421939407, 1.774692315, 1.9789501619999998, "Cluster 2" ], [ "Upper middle income", 2.719154058, 2.6691794090000003, 2.8588169989999996, 2.755691745, 2.7583880960000005, 2.64226068, 2.6614438999999996, 2.653640275, 2.7072452680000003, 2.71322832, 2.754573558, 2.798324718, 2.916842398, 3.039129579, 3.401348935, 3.258324431, 3.26052306, 3.3247364010000005, 3.3759578180000003, 3.424686871, "Cluster 2" ], [ "Albania", 1.713004455, 1.7461975459999999, 2.024509405, 2.0951277569999998, 2.510171417, 2.2584179580000003, 2.2922240190000003, 2.256325893, 2.2521041509999997, 2.67940487, 2.7064554430000003, 2.5751360919999997, 2.6291710999999998, 2.69389845, 2.833575743, 2.47656803, 2.84917086, 2.7357041, 2.8359842360000003, 2.936373275, "Cluster 2" ], [ "Angola", 4.659118212, 1.7397817740000001, 2.0192194409999997, 1.414705389, 2.131797787, 1.677216464, 2.812403394, 1.685217542, 2.044369358, 2.407840515, 2.02464638, 3.022435345, 2.213764019, 2.716334452, 2.663917207, 2.0612546640000002, 2.155094274, 2.137316503, 3.080408392, 2.124912195, "Cluster 2" ], [ "Armenia", 1.996272562, 1.621148073, 1.407496163, 1.644913074, 1.612414885, 1.1375319990000001, 1.5914746219999998, 1.361332463, 1.516570269, 1.404450704, 1.905053401, 2.0528820530000003, 2.099284998, 1.764770313, 2.010005376, 1.9227140630000001, 1.938903536, 1.8756815409999998, 1.946690997, 1.925675667, "Cluster 2" ], [ "Azerbaijan", 1.3917525780000002, 1.485547019, 1.228625713, 0.903807033, 0.985430464, 0.866892751, 0.84650113, 0.791817883, 0.82967797, 1.0286700359999998, 0.880905375, 0.86418436, 0.980253879, 0.824675486, 1.33896972, 1.168020723, 1.080987674, 1.210596594, 1.150183905, 1.230967479, "Cluster 2" ], [ "Bahamas, The", 2.729658793, 2.773621504, 2.357290763, 2.539504821, 2.467818788, 2.502547587, 2.466895954, 2.5106654280000003, 2.647886116, 2.880435634, 2.642189647, 3.2726021, 3.18150171, 3.354877435, 3.5265241489999997, 3.4608155039999997, 3.575056242, 3.298249273, 3.07695572, 3.5506726960000004, "Cluster 2" ], 
[ "Bahrain", 2.818546496, 2.7515132039999997, 3.047721744, 2.881320773, 2.838727708, 2.36241776, 2.532878513, 2.5843232030000003, 2.501123649, 2.267809586, 2.156522233, 2.125250656, 2.184567246, 2.313058037, 2.748444379, 2.593379391, 2.383532755, 2.7626622419999998, 3.015994395, 3.150500297, "Cluster 2" ], [ "Bangladesh", 1.199805247, 1.0312841240000001, 0.968124768, 0.9353350979999999, 0.9351601490000001, 0.946712407, 1.024926461, 1.067809827, 0.975548071, 1.042067184, 0.9668001420000001, 1.038830186, 0.987683698, 0.9537524690000001, 0.991099631, 1.05017299, 1.041090103, 0.984483722, 0.810323956, 0.786532509, "Cluster 2" ], [ "Belize", 2.632365197, 2.048040973, 2.263610979, 2.155696602, 2.035489918, 2.091697325, 2.5894225509999997, 2.456541789, 2.589394307, 2.507171752, 2.647951095, 2.669250969, 3.022312925, 3.290674586, 3.862427163, 3.858381866, 3.725604295, 3.5777434360000004, 3.777130746, 3.879657845, "Cluster 2" ], [ "Benin", 2.111729724, 2.0315509240000003, 1.814422789, 1.939795897, 2.109912315, 1.917526784, 2.308263635, 1.888670405, 2.2112665259999997, 2.175232784, 2.3524798909999998, 2.385750932, 2.307085606, 2.137696725, 2.328624079, 2.688570362, 2.9290097580000003, 2.15409384, 2.215456479, 2.251196286, "Cluster 2" ], [ "Brunei Darussalam", 2.294038745, 3.0164979919999997, 3.01723691, 3.7179108860000003, 3.1839404819999997, 2.59858883, 2.576781266, 2.5673854080000003, 2.593538693, 2.522266585, 2.2158971480000003, 1.929077942, 2.03867096, 2.015774515, 2.591951691, 2.520024437, 2.066757971, 2.112532457, 2.407480899, 2.485567877, "Cluster 2" ], [ "Burkina Faso", 1.8658619580000002, 1.933787219, 2.0678869680000003, 2.061326682, 2.191443603, 2.016915355, 1.832448876, 2.256686535, 2.6042529930000002, 3.464384444, 4.091775992, 3.741064955, 3.995721739, 3.996973964, 3.6583793260000004, 3.9711797669999997, 2.95514785, 2.98036859, 3.48939536, 2.593973739, "Cluster 2" ], [ "Burundi", 1.34643228, 1.4941034169999998, 1.130843622, 1.2478422040000001, 1.238485735, 
1.4043644640000001, 1.6344859109999998, 1.55512254, 1.345188237, 2.544952098, 2.937796431, 3.5288293360000003, 3.7804362, 3.355311709, 3.093040181, 5.499656744, 5.401877297, 4.930865336, 4.3966530530000005, 3.9737275569999997, "Cluster 2" ], [ "Cambodia", 1.1239033040000002, 2.642772374, 2.0557185319999998, 1.356775567, 1.184934454, 1.3401496179999999, 1.30376831, 1.520439279, 2.416164271, 2.3923241180000003, 1.618218744, 1.2352885740000001, 1.321770862, 1.1113312290000001, 1.312468532, 1.440774999, 1.33985553, 1.5033406980000001, 1.397584709, 1.251042011, "Cluster 2" ], [ "Cameroon", 0.9002687140000001, 0.893368284, 0.978965995, 0.7846296140000001, 0.8337348240000001, 0.9326291859999999, 1.1291992770000001, 1.290383204, 1.3317280120000001, 1.129638122, 1.120079177, 1.076092314, 1.065776207, 1.049287334, 1.28313286, 1.5076022759999999, 1.331447157, 1.066747097, 1.012469674, 0.9386336909999999, "Cluster 2" ], [ "Sub-Saharan Africa (IDA & IBRD countries)", 2.449863298, 2.516644595, 2.494454088, 2.437191306, 2.374140004, 2.271764359, 2.36589666, 2.179881571, 2.392890886, 2.48694164, 2.485235818, 2.510834419, 2.4624205690000003, 2.5124766309999997, 2.71107721, 2.48903738, 2.624569905, 2.543530054, 2.4598089, 2.314823041, "Cluster 2" ], [ "Sub-Saharan Africa (excluding high income)", 2.447084114, 2.513732415, 2.490668403, 2.433949374, 2.370627245, 2.2691877519999997, 2.363319605, 2.177062415, 2.3902048280000003, 2.484998793, 2.4836869530000003, 2.509609703, 2.4617436809999997, 2.512576224, 2.71133, 2.4885153559999997, 2.6241637030000002, 2.5426359130000002, 2.459070655, 2.3141783609999997, "Cluster 2" ], [ "Sub-Saharan Africa", 2.449863298, 2.516644595, 2.494454088, 2.437191306, 2.374140004, 2.271764359, 2.36589666, 2.179881571, 2.392890886, 2.48694164, 2.485235818, 2.510834419, 2.4624205690000003, 2.5124766309999997, 2.71107721, 2.48903738, 2.624569905, 2.543530054, 2.4598089, 2.314823041, "Cluster 2" ], [ "South Asia (IDA & IBRD)", 1.03503164, 0.99799026, 
1.0374988109999999, 1.070832413, 1.081228019, 1.0670523109999999, 1.042238308, 1.032538376, 0.9733766779999999, 1.018914387, 1.103442311, 1.103521575, 1.09051214, 1.151605829, 1.205501388, 1.181098088, 1.181152879, 1.19027209, 1.28224814, 1.3678991719999998, "Cluster 2" ], [ "Caribbean small states", 2.8015183710000002, 2.856683624, 2.9971566689999998, 2.9894512000000004, 2.7678577189999998, 2.826752141, 2.6799687530000003, 2.888692649, 2.740592575, 2.845970706, 2.629579982, 2.650899715, 2.79066499, 2.8229131219999997, 3.408651206, 3.264063783, 3.08765286, 3.3143030839999996, 3.318431579, 3.2600123180000002, "Cluster 2" ], [ "Early-demographic dividend", 2.203164007, 2.156631825, 2.227311469, 2.364099533, 2.454393636, 2.450554821, 2.52708105, 2.347701787, 2.36326343, 2.346823705, 2.337346649, 2.369883662, 2.385250838, 2.405125681, 2.701259981, 2.5071308709999998, 2.495490968, 2.497340218, 2.586701422, 2.665602603, "Cluster 2" ], [ "East Asia & Pacific (excluding high income)", 1.615852443, 1.640251145, 1.6783221080000001, 1.764602604, 1.75401335, 1.689184662, 1.626887281, 1.736855763, 1.8086373709999999, 1.815666676, 1.79631989, 1.8752670930000002, 2.076666145, 2.256213902, 2.5749937469999997, 2.53842979, 2.669787471, 2.8114897130000003, 2.881804892, 2.975050955, "Cluster 2" ], [ "East Asia & Pacific (IDA & IBRD countries)", 1.615852443, 1.640251145, 1.6783221080000001, 1.764602604, 1.75401335, 1.689184662, 1.626887281, 1.736855763, 1.8086373709999999, 1.815666676, 1.79631989, 1.8752670930000002, 2.076666145, 2.256213902, 2.5749937469999997, 2.53842979, 2.669787471, 2.8114897130000003, 2.881804892, 2.975050955, "Cluster 2" ], [ "Heavily indebted poor countries (HIPC)", 1.630562619, 1.7167492340000001, 1.65244635, 1.7718702569999998, 1.834357688, 1.79637023, 2.015090682, 2.068192564, 2.1669018159999998, 2.216858939, 2.345166979, 2.4488834919999998, 2.3024619090000003, 2.429057526, 2.539924114, 2.712862763, 2.661827679, 2.58866833, 2.580611781, 2.532968767, "Cluster 
2" ], [ "Late-demographic dividend", 2.749846218, 2.750524463, 2.94232719, 2.7954760419999998, 2.721888766, 2.5495596369999998, 2.589519016, 2.719474646, 2.735925695, 2.744432242, 2.775096107, 2.818204592, 2.932192624, 3.090526918, 3.408418886, 3.27272891, 3.265710729, 3.349820181, 3.376662873, 3.4269252519999998, "Cluster 2" ], [ "Least developed countries: UN classification", 1.52548196, 1.4297370919999999, 1.430388652, 1.471607242, 1.522391719, 1.465800489, 1.689041896, 1.690471391, 1.800899345, 1.880999571, 1.898899247, 2.157903627, 1.9138546930000002, 2.140700178, 2.172629716, 2.198171697, 2.177006608, 1.96354228, 2.031209935, 1.919877296, "Cluster 2" ], [ "Central African Republic", 1.363974592, 2.023371914, 1.216183896, 1.4170993580000002, 1.871718297, 2.1021468359999997, 1.863889207, 2.062251945, 2.0768119130000002, 1.845115241, 2.1146899390000002, 1.923990235, 2.036722449, 2.290508965, 1.497162132, 1.9771464330000001, 1.840226144, 1.7680298669999999, 1.913359234, 2.0569429830000003, "Cluster 2" ], [ "Low & middle income", 2.401016022, 2.351839879, 2.507134082, 2.4654399419999997, 2.427530862, 2.34705236, 2.376884847, 2.345132586, 2.384587803, 2.4076141769999997, 2.458114132, 2.506991643, 2.6052197390000003, 2.734475624, 3.005713015, 2.869481703, 2.894131937, 2.9566967039999996, 3.0130862210000005, 3.0383182860000004, "Cluster 2" ], [ "Lower middle income", 1.3821720169999998, 1.344572554, 1.355006184, 1.4310212219999998, 1.3888542769999999, 1.384144461, 1.4288831530000001, 1.380571025, 1.3841809880000002, 1.400072101, 1.4280820419999998, 1.478788431, 1.521790939, 1.559230946, 1.5884407409999999, 1.5131299669999998, 1.519120119, 1.5812649540000001, 1.639779694, 1.6358329619999998, "Cluster 2" ], [ "Middle East & North Africa", 2.423456889, 2.430438328, 2.520586788, 2.585412087, 2.614487018, 2.609441929, 2.869833259, 2.818405786, 2.735597223, 2.5723098419999997, 2.411219853, 2.45275055, 2.439045576, 2.352177305, 3.016616398, 2.714642506, 2.711284804, 
2.895571978, 3.06782614, 3.224936356, "Cluster 2" ], [ "Middle East & North Africa (excluding high income)", 1.986615421, 2.000319073, 2.116533205, 2.180356186, 2.073848436, 2.15353996, 2.4061859269999997, 2.452578692, 2.404325255, 2.413375024, 2.277110381, 2.33316934, 2.38604766, 2.4840236190000002, 2.883655535, 2.674039179, 2.6663160009999998, 2.946036225, 3.1133615810000004, 3.195117055, "Cluster 2" ], [ "Middle East & North Africa (IDA & IBRD countries)", 1.986615421, 2.000319073, 2.116533205, 2.180356186, 2.073848436, 2.15353996, 2.4061859269999997, 2.452578692, 2.404325255, 2.413375024, 2.277110381, 2.33316934, 2.38604766, 2.4840236190000002, 2.883655535, 2.674039179, 2.6663160009999998, 2.946036225, 3.1133615810000004, 3.195117055, "Cluster 2" ], [ "Middle income", 2.412678871, 2.36362262, 2.5202424480000003, 2.477042313, 2.43762049, 2.356948176, 2.382038559, 2.349752613, 2.387242359, 2.4088153219999997, 2.458108718, 2.504454687, 2.60902103, 2.73939142, 3.0142344189999997, 2.872383447, 2.896995845, 2.962450623, 3.0212647560000003, 3.0467369210000004, "Cluster 2" ], [ "Pre-demographic dividend", 1.410676744, 1.300913774, 1.3471565680000002, 1.43327288, 1.489741772, 1.4058226130000002, 1.6053387190000001, 1.4385881090000001, 1.6097842219999998, 2.055879709, 1.894072295, 1.9102146830000002, 1.9152088569999999, 2.147427747, 2.25671329, 1.826936093, 1.921276365, 2.018579254, 2.092089478, 1.933374353, "Cluster 2" ], [ "South Asia", 1.03503164, 0.99799026, 1.0374988109999999, 1.070832413, 1.081228019, 1.0670523109999999, 1.042238308, 1.032538376, 0.9733766779999999, 1.018914387, 1.103442311, 1.103521575, 1.09051214, 1.151605829, 1.205501388, 1.181098088, 1.181152879, 1.19027209, 1.28224814, 1.3678991719999998, "Cluster 2" ], [ "Low income", 1.5301250290000001, 1.483895647, 1.5211285190000001, 1.657153759, 1.738222289, 1.7597896480000002, 2.034208573, 2.063321574, 2.217968593, 2.32876762, 2.458480802, 2.691171989, 2.317963439, 2.365497375, 2.4214922619999997, 
2.642192573, 2.6593637230000002, 2.511732098, 2.394346629, 2.43910583, "Cluster 2" ], [ "Mauritania", 2.230334388, 1.3288083929999999, 1.49219146, 2.084762022, 2.901813013, 2.770993523, 1.879560462, 2.862060366, 2.179218351, 2.464112525, 2.033356056, 1.4476164319999998, 1.6517913519999998, 1.3545647330000001, 1.79980274, 1.52105378, 1.279141378, 1.370247011, 1.726038803, 1.871016263, "Cluster 2" ], [ "Zambia", 2.152488857, 2.484677806, 2.585239318, 3.1339650839999997, 3.403697035, 3.7198999230000003, 3.5265592110000004, 4.018109627, 4.18766916, 3.65708439, 3.9569790069999997, 2.75584562, 1.885822023, 2.18994158, 2.261667785, 2.27995642, 2.148931957, 2.536370459, 2.7654047189999997, 2.760094545, "Cluster 2" ], [ "Comoros", 2.8797862060000003, 2.7139497039999996, 2.584925576, 2.185036147, 1.964426649, 1.5227230969999999, 1.0946753390000001, 1.6697581019999999, 1.815474839, 2.010438445, 2.274051852, 2.5071515140000002, 2.80299141, 3.094532063, 1.72121212, 1.454408898, 1.656759335, 2.646604021, 2.003193245, 2.2173203519999998, "Cluster 2" ], [ "Yemen, Rep.", 1.358739823, 1.644500639, 1.898410163, 2.324037809, 2.127391156, 2.2352856269999997, 2.294180651, 2.142648503, 2.1817307269999997, 1.85433054, 1.5511169759999999, 1.5216019440000002, 1.462789576, 1.5650183009999998, 1.3366978040000002, 1.299130895, 1.3504469030000001, 1.5716278190000001, 1.410009971, 1.271870986, "Cluster 2" ], [ "India", 1.051510963, 1.006714181, 1.072536175, 1.104334395, 1.130458988, 1.1124430090000001, 1.0779961820000001, 1.025761987, 0.984930506, 1.022681766, 1.1342577, 1.110610623, 1.099600724, 1.162740942, 1.2209710809999998, 1.161015809, 1.175376637, 1.183872748, 1.2868865840000001, 1.4072376180000001, "Cluster 2" ], [ "Indonesia", 0.708979047, 0.726782129, 0.676852206, 0.7080650270000001, 0.772645557, 0.72468259, 0.963565797, 0.884272738, 1.015301176, 0.9348711359999999, 0.803211001, 0.912583094, 1.126425894, 1.005797618, 1.019549421, 1.03300414, 1.028914047, 1.147736521, 1.153628987, 
1.0755363009999999, "Cluster 2" ], [ "Iran, Islamic Rep.", 1.6760716930000001, 1.725678443, 1.942216566, 2.137651028, 1.86003165, 1.8631224999999998, 2.194736416, 2.189274716, 2.348239338, 2.23931692, 2.333458198, 2.568090196, 2.4239648469999997, 2.437820381, 2.879141091, 2.684682081, 2.4790332630000003, 2.687600161, 2.7340401539999997, 2.840802145, "Cluster 2" ], [ "Jamaica", 2.224280687, 2.859074529, 3.354873879, 3.383751914, 2.711113592, 3.220452714, 2.449632293, 2.787349228, 2.304267888, 2.723855098, 1.9858449269999998, 2.3102109090000003, 2.5349200819999997, 2.893671205, 2.8937382119999997, 2.99010608, 2.7952228110000004, 3.273760445, 3.380134876, 2.8085780330000003, "Cluster 2" ], [ "Kazakhstan", 2.953489978, 2.759064102, 3.0026158069999997, 3.092985258, 2.296107627, 2.1193106530000003, 1.965795165, 1.933120902, 2.014321414, 2.294666524, 2.521541794, 2.3057194, 1.784132566, 2.262578318, 2.651119229, 2.527218011, 2.271552738, 2.40821469, 2.18920504, 2.3679030869999997, "Cluster 2" ], [ "Kenya", 1.969355371, 1.662980154, 1.599507906, 1.994903268, 1.67225462, 2.166725101, 2.067304171, 1.9431644419999998, 1.9281390840000001, 1.7957208980000001, 1.845407496, 1.624314663, 1.596858528, 1.40330995, 1.641624369, 1.418735549, 2.623533409, 3.3229374480000002, 3.3464041819999997, 3.5038660580000003, "Cluster 2" ], [ "Korea, Rep.", 1.37837002, 1.567106233, 1.661384573, 1.896960077, 2.0360782019999997, 2.069427846, 2.6287877219999998, 2.496197951, 2.567924451, 2.604738563, 2.8184627260000004, 3.145604415, 3.279317912, 3.364369569, 3.756141758, 3.855133327, 3.8213452130000003, 3.851691628, 3.909878493, 3.985248041, "Cluster 2" ], [ "Kuwait", 3.0793817160000003, 2.75312334, 2.9512544810000003, 3.5051093939999998, 2.9118429619999997, 1.9074589430000002, 2.938514016, 2.8451164789999996, 2.591638049, 2.197676413, 1.8984359730000002, 1.826202921, 1.678892606, 1.511862693, 3.3709338939999998, 2.334489191, 2.255683318, 2.187222399, 2.1656254280000002, 2.614422533, "Cluster 2" ], [ 
"Kyrgyz Republic", 3.0586966139999996, 2.518306598, 2.561680082, 2.5370569880000002, 2.251547927, 2.0709018009999998, 1.96892384, 2.149216502, 2.056844, 2.275178259, 2.38059842, 3.276997235, 3.530000425, 3.1283246069999997, 3.785352567, 3.71014072, 3.701089568, 4.197243855, 3.8799367869999997, 3.639437553, "Cluster 2" ], [ "Lao PDR", 2.179347721, 1.827522348, 2.07175976, 1.8517304780000001, 1.111702922, 1.13056391, 1.177790717, 1.0828706259999998, 1.2709968, 0.801898709, 0.7346070859999999, 1.1470211890000002, 1.029730057, 1.001469523, 1.8583031069999998, 1.278180688, 0.835809612, 0.79224628, 0.964872836, 0.942733752, "Cluster 2" ], [ "Libya", 1.5145279969999998, 1.662741707, 1.7901981919999999, 1.884513389, 1.6503777830000002, 1.6598308590000002, 2.210293692, 3.056726273, 2.692002637, 2.276618671, 1.7491174269999998, 1.640166807, 1.748097339, 1.382407555, 2.178180015, 2.136789648, 3.019999999, 3.019999999, 3.019999999, 3.6540791589999997, "Cluster 2" ], [ "Madagascar", 1.4415262030000002, 1.9149721119999998, 2.14802212, 1.96133518, 2.0399136369999997, 2.573304228, 2.808515662, 2.7432138360000002, 2.260174188, 2.43699522, 2.621449986, 2.817711615, 2.7398218389999998, 2.41891842, 2.408212919, 2.606558609, 2.4358722790000003, 1.8161052969999998, 2.560444941, 1.473414605, "Cluster 2" ], [ "Malaysia", 1.673580101, 1.693100127, 1.503468834, 1.6234893730000002, 1.682393231, 1.6935325469999998, 1.990382325, 1.95887394, 2.362041422, 2.118040539, 1.69082761, 2.011816692, 1.961867672, 1.936706363, 2.336639744, 2.2862965859999997, 2.135913733, 2.21523329, 2.2031471540000003, 2.300290016, "Cluster 2" ], [ "Mali", 2.627422294, 2.9937876169999997, 2.478276148, 2.136752933, 1.819396693, 2.069921322, 2.872448632, 2.538877445, 2.757198984, 3.091886553, 3.0385294910000002, 3.164633564, 3.3665769610000003, 3.1356973139999997, 3.148995784, 2.807459661, 3.0152463110000003, 2.250262582, 1.134273081, 1.568172106, "Cluster 2" ], [ "China", 1.780381954, 1.763716129, 1.7806565580000002, 
1.8120753459999999, 1.8349422359999998, 1.7598434680000001, 1.621284224, 1.7146722380000001, 1.746529994, 1.793429835, 1.805920306, 1.83853832, 2.026592106, 2.292123452, 2.664482629, 2.653820098, 2.8106526560000002, 2.945813766, 3.005601408, 3.095174286, "Cluster 2" ], [ "Guinea-Bissau", 1.59182256, 2.107388011, 2.249324138, 2.207081665, 1.458689029, 0.5159652370000001, 0.483604876, 1.29016916, 1.2961535690000001, 0.8552961729999999, 1.083538194, 1.068546513, 1.363201444, 1.1577875359999998, 1.916627082, 1.849453411, 1.0469749320000001, 1.591370587, 1.6250123669999998, 1.145122307, "Cluster 2" ], [ "Haiti", 2.700778316, 2.4568022959999998, 2.444218128, 2.031842786, 1.696652901, 1.679556587, 1.472578763, 1.411106475, 1.585349102, 2.029269522, 0.938494956, 1.355593535, 1.326609423, 1.355999841, 1.3726482, 1.410583252, 1.80632117, 0.980271294, 1.724541255, 1.559516418, "Cluster 2" ], [ "Guatemala", 1.568251834, 1.4740888109999999, 1.652352634, 1.687897756, 1.8225683169999998, 1.906287984, 2.1653825419999997, 2.126950411, 2.250780088, 2.18862221, 2.151933847, 2.389327876, 2.26818626, 2.319787972, 2.516993404, 2.375496937, 2.15314798, 2.14774653, 2.321889304, 2.334729015, "Cluster 2" ], [ "Congo, Dem. 
Rep.", 0.151469658, 0.113020059, 0.20486781199999998, 0.178185156, 0.24769671199999999, 0.044703612000000004, 0.14417975, 0.160080405, 0.700026844, 0.71835464, 0.752462162, 0.938991328, 1.209434345, 2.099872761, 2.362979061, 1.062595613, 1.255268552, 1.687173628, 1.3234417509999998, 1.59835647, "Cluster 2" ], [ "Congo, Rep.", 1.875942346, 1.7216115490000001, 1.9118363180000002, 2.218401855, 1.752764882, 1.222592062, 1.334532489, 1.287959153, 1.300179166, 1.369675105, 1.434608509, 1.494032765, 1.545764133, 1.238592875, 1.14114182, 1.386578972, 1.977375259, 3.149421373, 4.05731117, 4.2119208519999995, "Cluster 2" ], [ "Cote d'Ivoire", 1.645869281, 1.8541070080000002, 2.003289854, 1.8888131119999998, 1.799667406, 1.7880357040000001, 1.290257864, 1.40860098, 1.338333609, 1.4716744259999999, 1.269719496, 1.358403825, 1.4282131319999998, 1.528626424, 1.6968101519999998, 1.6761721680000001, 1.635696974, 1.885045493, 1.7965878830000002, 1.6785384909999999, "Cluster 2" ], [ "Cyprus", 1.697054395, 1.774813392, 1.948338097, 2.338116275, 2.388126932, 2.402830234, 2.449259438, 2.7545184480000002, 3.082626861, 2.813460787, 2.662677211, 2.663821238, 2.5780400130000003, 2.8508256060000003, 3.3114723930000003, 3.425307365, 3.5076350819999997, 3.4116037089999995, 3.4707913969999997, 3.332019222, "Cluster 2" ], [ "Dominican Republic", 1.155220766, 1.2382753, 1.48835433, 1.7989108280000001, 2.00188919, 2.192495065, 1.925895905, 2.008738541, 1.8208773669999998, 1.3886192519999998, 1.4859490469999999, 1.781605827, 1.9925087609999999, 2.051277828, 2.245560221, 2.263964847, 2.604386077, 2.7018122589999995, 2.623467358, 2.927375648, "Cluster 2" ], [ "Ecuador", 1.8815244230000001, 2.204202458, 1.9874813930000002, 1.400740525, 1.3751416319999998, 0.8960031829999999, 1.228463152, 1.428875973, 1.425714581, 1.4293144180000001, 1.309875442, 1.423655771, 1.5062408999999999, 1.630354665, 2.186591275, 2.4594076240000002, 2.597380991, 2.957292999, 3.858385301, 4.508156573, "Cluster 2" ], [ "Egypt, 
Arab Rep.", 1.6460250419999998, 1.620664666, 1.785539455, 1.969811265, 2.1234134, 2.246958395, 2.327558282, 2.403817061, 2.068547965, 1.985911495, 1.9850409880000002, 2.287519277, 2.0466957359999998, 2.0297271969999997, 2.058126846, 1.872592845, 1.990804136, 1.9092313269999999, 2.057468101, 2.155384501, "Cluster 2" ], [ "Equatorial Guinea", 3.883858135, 2.7329980910000002, 2.251245641, 3.055954265, 1.922256608, 2.166271678, 1.335525197, 1.111721515, 1.52759716, 1.3524546240000002, 0.9139821140000001, 1.4674520659999999, 1.640828358, 1.795079572, 4.461108402, 3.057171112, 2.596654331, 3.325881938, 2.961789903, 2.932710442, "Cluster 2" ], [ "Eritrea", 2.171974402, 1.321100351, 1.770926971, 1.85142628, 1.996568895, 1.588511165, 1.386781377, 1.6404693430000001, 1.291688995, 1.236014558, 1.095939139, 1.4704505280000002, 1.490338129, 1.9314296069999999, 1.397960224, 1.424863559, 1.40782257, 1.383976464, 1.37826626, 1.527464004, "Cluster 2" ], [ "Ethiopia", 1.201089905, 1.113331724, 1.308283107, 1.634136008, 1.842742815, 2.382655413, 2.230818205, 2.550281355, 2.556368908, 2.37364068, 2.580334349, 2.529405628, 2.571477099, 2.221322189, 2.421519695, 3.716736035, 3.735155728, 3.3105951260000004, 2.953637718, 2.86756675, "Cluster 2" ], [ "Fiji", 2.463687222, 2.643610757, 2.8924071430000002, 2.6044336130000003, 2.50533762, 3.2355711560000002, 2.628178355, 2.8544881930000003, 2.7002647580000003, 2.88766334, 2.936055816, 3.012361986, 2.7919826010000004, 2.780329042, 2.953906158, 2.9652059360000003, 2.677144195, 2.762148643, 2.902243871, 2.95320811, "Cluster 2" ], [ "Gabon", 1.257445299, 1.28647559, 1.192176302, 1.731343904, 1.213987698, 1.154856156, 1.285837405, 1.207290008, 1.467581307, 1.36059829, 1.114980978, 1.235086135, 1.2669780659999998, 1.076241407, 1.5480996480000002, 2.44092455, 2.103287948, 2.210201203, 2.931829623, 2.350580925, "Cluster 2" ], [ "Gambia, The", 1.041104569, 0.8962045120000001, 0.921290897, 1.194823096, 1.25261532, 1.234866709, 1.55374665, 
1.4073568930000002, 2.1239748780000003, 2.5148502390000003, 2.8975990080000003, 3.244630936, 3.40312534, 3.527012899, 3.482328264, 3.4330868760000004, 3.735121027, 3.672212762, 4.181628453, 5.045612515, "Cluster 2" ], [ "Georgia", 0.267281215, 0.8742158040000001, 1.491279099, 1.195657068, 1.140527412, 1.180608888, 1.388194366, 1.400350039, 1.25729464, 1.307242467, 1.648504578, 1.7716621019999998, 1.449623425, 1.7799744119999998, 2.270258573, 2.2899291330000002, 1.7006243840000002, 1.210348913, 1.276120238, 1.552730538, "Cluster 2" ], [ "Ghana", 1.6228713819999998, 2.0189271019999997, 1.4356055330000002, 1.7727537830000002, 1.5933775380000001, 1.4980943409999998, 2.045003688, 1.508850229, 1.580562376, 2.399043819, 2.923944957, 3.0442281560000004, 3.729887891, 3.223054494, 3.6749633619999997, 3.829376748, 3.5755204860000003, 3.140675827, 3.242160133, 2.128885085, "Cluster 2" ], [ "Guinea", 1.24440635, 0.7692242340000001, 0.753971712, 0.9485828709999999, 1.0340789959999999, 1.095939452, 1.27041596, 1.313300227, 1.313311747, 0.879682253, 0.554865842, 0.66542757, 0.418226466, 0.7846244029999999, 1.346498634, 2.011768888, 1.977158975, 2.0989461769999997, 2.378242841, 2.7362447810000003, "Cluster 2" ] ], "hovertemplate": "Cluster=%{customdata[21]}
Country Name=%{customdata[0]}
1995=%{customdata[1]}
1996=%{customdata[2]}
1997=%{customdata[3]}
1998=%{customdata[4]}
1999=%{customdata[5]}
2000=%{customdata[6]}
2001=%{customdata[7]}
2002=%{customdata[8]}
2003=%{customdata[9]}
2004=%{customdata[10]}
2005=%{customdata[11]}
2006=%{customdata[12]}
2007=%{customdata[13]}
2008=%{customdata[14]}
2009=%{customdata[15]}
2010=%{customdata[16]}
2011=%{customdata[17]}
2012=%{customdata[18]}
2013=%{customdata[19]}
2014=%{customdata[20]}", "legendgroup": "Cluster 2", "marker": { "color": "#00cc96" }, "name": "Cluster 2", "notched": true, "offsetgroup": "Cluster 2", "showlegend": false, "type": "box", "x": [ "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2", "Cluster 2" ], "xaxis": "x2", "yaxis": "y2" }, { "alignmentgroup": "True", "bingroup": "x", "hovertemplate": "Cluster=%{x}
count=%{y}", "legendgroup": "Cluster 3", "marker": { "color": "#ab63fa", "opacity": 0.7 }, "name": "Cluster 3", "offsetgroup": "Cluster 3", "orientation": "v", "showlegend": true, "type": "histogram", "x": [ "Cluster 3", "Cluster 3", "Cluster 3" ], "xaxis": "x", "yaxis": "y" }, { "alignmentgroup": "True", "customdata": [ [ "Nauru", 12.33493098, 11.59428355, 11.82601857, 12.56498453, 12.337983900000001, 12.54768588, 13.31280697, 14.53541812, 13.45467078, 10.64962726, 11.61777519, 12.57633671, 18.10282404, 15.60670301, 8.727534152, 8.454551816, 7.110556956, 6.523965614, 4.192163552, 2.8676663239999995, "Cluster 3" ], [ "Tuvalu", 7.960185727000001, 11.27466332, 8.08774651, 8.614014716, 9.221982956, 15.66666666, 17.26923077, 14.386206900000001, 21.65409429, 16.74897207, 18.23437732, 19.25675216, 16.85609763, 13.26834375, 12.69334417, 16.62857143, 16.84210527, 13.64102565, 16.475, 16.40476191, "Cluster 3" ], [ "Marshall Islands", 28.04978525, 16.67889286, 17.16813342, 15.64522955, 15.42742281, 19.24043333, 16.07197043, 14.8351456, 14.21128802, 15.09092986, 14.67971014, 17.05555555, 17.592, 16.48169934, 16.02894737, 14.39817073, 14.271676300000001, 13.90652174, 14.551897899999998, 14.44916839, "Cluster 3" ] ], "hovertemplate": "Cluster=%{customdata[21]}
Country Name=%{customdata[0]}
1995=%{customdata[1]}
1996=%{customdata[2]}
1997=%{customdata[3]}
1998=%{customdata[4]}
1999=%{customdata[5]}
2000=%{customdata[6]}
2001=%{customdata[7]}
2002=%{customdata[8]}
2003=%{customdata[9]}
2004=%{customdata[10]}
2005=%{customdata[11]}
2006=%{customdata[12]}
2007=%{customdata[13]}
2008=%{customdata[14]}
2009=%{customdata[15]}
2010=%{customdata[16]}
2011=%{customdata[17]}
2012=%{customdata[18]}
2013=%{customdata[19]}
2014=%{customdata[20]}", "legendgroup": "Cluster 3", "marker": { "color": "#ab63fa" }, "name": "Cluster 3", "notched": true, "offsetgroup": "Cluster 3", "showlegend": false, "type": "box", "x": [ "Cluster 3", "Cluster 3", "Cluster 3" ], "xaxis": "x2", "yaxis": "y2" } ], "layout": { "barmode": "relative", "legend": { "title": { "text": "Cluster" }, "tracegroupgap": 0 }, "margin": { "t": 60 }, "template": { "data": { "bar": [ { "error_x": { "color": "#2a3f5f" }, "error_y": { "color": "#2a3f5f" }, "marker": { "line": { "color": "#E5ECF6", "width": 0.5 } }, "type": "bar" } ], "barpolar": [ { "marker": { "line": { "color": "#E5ECF6", "width": 0.5 } }, "type": "barpolar" } ], "carpet": [ { "aaxis": { "endlinecolor": "#2a3f5f", "gridcolor": "white", "linecolor": "white", "minorgridcolor": "white", "startlinecolor": "#2a3f5f" }, "baxis": { "endlinecolor": "#2a3f5f", "gridcolor": "white", "linecolor": "white", "minorgridcolor": "white", "startlinecolor": "#2a3f5f" }, "type": "carpet" } ], "choropleth": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "choropleth" } ], "contour": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "contour" } ], "contourcarpet": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "contourcarpet" } ], "heatmap": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] 
], "type": "heatmap" } ], "heatmapgl": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "heatmapgl" } ], "histogram": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "histogram" } ], "histogram2d": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "histogram2d" } ], "histogram2dcontour": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "histogram2dcontour" } ], "mesh3d": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "type": "mesh3d" } ], "parcoords": [ { "line": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "parcoords" } ], "pie": [ { "automargin": true, "type": "pie" } ], "scatter": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatter" } ], "scatter3d": [ { "line": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatter3d" } ], "scattercarpet": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": 
"" } }, "type": "scattercarpet" } ], "scattergeo": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattergeo" } ], "scattergl": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattergl" } ], "scattermapbox": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scattermapbox" } ], "scatterpolar": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterpolar" } ], "scatterpolargl": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterpolargl" } ], "scatterternary": [ { "marker": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "type": "scatterternary" } ], "surface": [ { "colorbar": { "outlinewidth": 0, "ticks": "" }, "colorscale": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "type": "surface" } ], "table": [ { "cells": { "fill": { "color": "#EBF0F8" }, "line": { "color": "white" } }, "header": { "fill": { "color": "#C8D4E3" }, "line": { "color": "white" } }, "type": "table" } ] }, "layout": { "annotationdefaults": { "arrowcolor": "#2a3f5f", "arrowhead": 0, "arrowwidth": 1 }, "coloraxis": { "colorbar": { "outlinewidth": 0, "ticks": "" } }, "colorscale": { "diverging": [ [ 0, "#8e0152" ], [ 0.1, "#c51b7d" ], [ 0.2, "#de77ae" ], [ 0.3, "#f1b6da" ], [ 0.4, "#fde0ef" ], [ 0.5, "#f7f7f7" ], [ 0.6, "#e6f5d0" ], [ 0.7, "#b8e186" ], [ 0.8, "#7fbc41" ], [ 0.9, "#4d9221" ], [ 1, "#276419" ] ], "sequential": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 
0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ], "sequentialminus": [ [ 0, "#0d0887" ], [ 0.1111111111111111, "#46039f" ], [ 0.2222222222222222, "#7201a8" ], [ 0.3333333333333333, "#9c179e" ], [ 0.4444444444444444, "#bd3786" ], [ 0.5555555555555556, "#d8576b" ], [ 0.6666666666666666, "#ed7953" ], [ 0.7777777777777778, "#fb9f3a" ], [ 0.8888888888888888, "#fdca26" ], [ 1, "#f0f921" ] ] }, "colorway": [ "#636efa", "#EF553B", "#00cc96", "#ab63fa", "#FFA15A", "#19d3f3", "#FF6692", "#B6E880", "#FF97FF", "#FECB52" ], "font": { "color": "#2a3f5f" }, "geo": { "bgcolor": "white", "lakecolor": "white", "landcolor": "#E5ECF6", "showlakes": true, "showland": true, "subunitcolor": "white" }, "hoverlabel": { "align": "left" }, "hovermode": "closest", "mapbox": { "style": "light" }, "paper_bgcolor": "white", "plot_bgcolor": "#E5ECF6", "polar": { "angularaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" }, "bgcolor": "#E5ECF6", "radialaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" } }, "scene": { "xaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" }, "yaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" }, "zaxis": { "backgroundcolor": "#E5ECF6", "gridcolor": "white", "gridwidth": 2, "linecolor": "white", "showbackground": true, "ticks": "", "zerolinecolor": "white" } }, "shapedefaults": { "line": { "color": "#2a3f5f" } }, "ternary": { "aaxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" }, "baxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" }, "bgcolor": "#E5ECF6", "caxis": { "gridcolor": "white", "linecolor": "white", "ticks": "" } }, "title": { "x": 0.05 }, "xaxis": { "automargin": true, "gridcolor": "white", "linecolor": "white", "ticks": "", "title": { "standoff": 15 }, "zerolinecolor": "white", 
"zerolinewidth": 2 }, "yaxis": { "automargin": true, "gridcolor": "white", "linecolor": "white", "ticks": "", "title": { "standoff": 15 }, "zerolinecolor": "white", "zerolinewidth": 2 } } }, "xaxis": { "anchor": "y", "categoryarray": [ "Cluster 0", "Cluster 1", "Cluster 2", "Cluster 3" ], "categoryorder": "array", "domain": [ 0, 1 ], "title": { "text": "Cluster" } }, "xaxis2": { "anchor": "y2", "domain": [ 0, 1 ], "matches": "x", "showgrid": true, "showticklabels": false }, "yaxis": { "anchor": "x", "domain": [ 0, 0.7326 ], "title": { "text": "count" } }, "yaxis2": { "anchor": "x2", "domain": [ 0.7426, 1 ], "matches": "y2", "showgrid": false, "showline": false, "showticklabels": false, "ticks": "" } } }, "text/html": [ "
\n", " \n", " \n", "
\n", " \n", "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "plot_model(kmeans, plot = 'distribution')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 6. Predict Model" ] }, { "cell_type": "code", "execution_count": 15, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
Country Name199519961997199819992000200120022003...200620072008200920102011201220132014Cluster
0Arab World2.0048682.0146022.0713092.1777122.3310002.3335962.5887512.5402382.450415...2.1330382.1668722.1012332.8300672.4896312.5395702.7112622.8954273.073161Cluster 2
1Caribbean small states2.8015182.8566842.9971572.9894512.7678582.8267522.6799692.8886932.740593...2.6509002.7906652.8229133.4086513.2640643.0876533.3143033.3184323.260012Cluster 2
2Central Europe and the Baltics4.6785284.7532094.6045744.4999884.6790824.5397114.6662724.9001965.100249...4.8414504.8090575.0547855.3949215.2843805.0962125.0413175.0292665.017717Cluster 0
3Early-demographic dividend2.2031642.1566322.2273112.3641002.4543942.4505552.5270812.3477022.363263...2.3698842.3852512.4051262.7012602.5071312.4954912.4973402.5867012.665603Cluster 2
4East Asia & Pacific4.4290904.2031524.2443514.4539844.6269204.6888494.6847904.6135374.635098...4.3671464.2973944.4348484.8652414.7758174.8717274.8668694.6432214.571448Cluster 0
\n", "

5 rows × 22 columns

\n", "
" ], "text/plain": [ " Country Name 1995 1996 1997 1998 \\\n", "0 Arab World 2.004868 2.014602 2.071309 2.177712 \n", "1 Caribbean small states 2.801518 2.856684 2.997157 2.989451 \n", "2 Central Europe and the Baltics 4.678528 4.753209 4.604574 4.499988 \n", "3 Early-demographic dividend 2.203164 2.156632 2.227311 2.364100 \n", "4 East Asia & Pacific 4.429090 4.203152 4.244351 4.453984 \n", "\n", " 1999 2000 2001 2002 2003 ... 2006 2007 \\\n", "0 2.331000 2.333596 2.588751 2.540238 2.450415 ... 2.133038 2.166872 \n", "1 2.767858 2.826752 2.679969 2.888693 2.740593 ... 2.650900 2.790665 \n", "2 4.679082 4.539711 4.666272 4.900196 5.100249 ... 4.841450 4.809057 \n", "3 2.454394 2.450555 2.527081 2.347702 2.363263 ... 2.369884 2.385251 \n", "4 4.626920 4.688849 4.684790 4.613537 4.635098 ... 4.367146 4.297394 \n", "\n", " 2008 2009 2010 2011 2012 2013 2014 \\\n", "0 2.101233 2.830067 2.489631 2.539570 2.711262 2.895427 3.073161 \n", "1 2.822913 3.408651 3.264064 3.087653 3.314303 3.318432 3.260012 \n", "2 5.054785 5.394921 5.284380 5.096212 5.041317 5.029266 5.017717 \n", "3 2.405126 2.701260 2.507131 2.495491 2.497340 2.586701 2.665603 \n", "4 4.434848 4.865241 4.775817 4.871727 4.866869 4.643221 4.571448 \n", "\n", " Cluster \n", "0 Cluster 2 \n", "1 Cluster 2 \n", "2 Cluster 0 \n", "3 Cluster 2 \n", "4 Cluster 0 \n", "\n", "[5 rows x 22 columns]" ] }, "execution_count": 15, "metadata": {}, "output_type": "execute_result" } ], "source": [ "pred_new = predict_model(kmeans, data=data)\n", "pred_new.head()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 7. 
Save / Load Model" ] }, { "cell_type": "code", "execution_count": 16, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Transformation Pipeline and Model Succesfully Saved\n" ] } ], "source": [ "save_model(kmeans, model_name='kmeans')" ] }, { "cell_type": "code", "execution_count": 17, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Transformation Pipeline and Model Sucessfully Loaded\n", "[Pipeline(memory=None,\n", " steps=[('dtypes',\n", " DataTypes_Auto_infer(categorical_features=[],\n", " display_types=True,\n", " features_todrop=['Country Name'],\n", " ml_usecase='regression',\n", " numerical_features=[],\n", " target='dummy_target',\n", " time_features=[])),\n", " ('imputer',\n", " Simple_Imputer(categorical_strategy='not_available',\n", " numeric_strategy='mean',\n", " target_variable=None)),\n", " ('new_levels1',\n", " New_...\n", " target='dummy_target')),\n", " ('feature_time',\n", " Make_Time_Features(list_of_features=None, time_feature=[])),\n", " ('group', Empty()), ('scaling', Empty()),\n", " ('P_transform', Empty()), ('binn', Empty()),\n", " ('fix_perfect', Empty()), ('rem_outliers', Empty()),\n", " ('dummy', Dummify(target='dummy_target')),\n", " ('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\n", " ('pca', Empty())],\n", " verbose=False), KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\n", " n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\n", " random_state=123, tol=0.0001, verbose=0)]\n" ] } ], "source": [ "loaded_kmeans = load_model('kmeans')\n", "print(loaded_kmeans)" ] }, { "cell_type": "code", "execution_count": 18, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
Pipeline(memory=None,\n",
       "         steps=[('dtypes',\n",
       "                 DataTypes_Auto_infer(categorical_features=[],\n",
       "                                      display_types=True,\n",
       "                                      features_todrop=['Country Name'],\n",
       "                                      ml_usecase='regression',\n",
       "                                      numerical_features=[],\n",
       "                                      target='dummy_target',\n",
       "                                      time_features=[])),\n",
       "                ('imputer',\n",
       "                 Simple_Imputer(categorical_strategy='not_available',\n",
       "                                numeric_strategy='mean',\n",
       "                                target_variable=None)),\n",
       "                ('new_levels1',\n",
       "                 New_...\n",
       "                                                    target='dummy_target')),\n",
       "                ('feature_time',\n",
       "                 Make_Time_Features(list_of_features=None, time_feature=[])),\n",
       "                ('group', Empty()), ('scaling', Empty()),\n",
       "                ('P_transform', Empty()), ('binn', Empty()),\n",
       "                ('fix_perfect', Empty()), ('rem_outliers', Empty()),\n",
       "                ('dummy', Dummify(target='dummy_target')),\n",
       "                ('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\n",
       "                ('pca', Empty())],\n",
       "         verbose=False)
DataTypes_Auto_infer(features_todrop=['Country Name'], ml_usecase='regression',\n",
       "                     target='dummy_target')
Simple_Imputer(categorical_strategy='not_available', numeric_strategy='mean',\n",
       "               target_variable=None)
New_Catagorical_Levels_in_TestData(replacement_strategy='least frequent',\n",
       "                                   target='dummy_target')
Empty()
Empty()
Empty()
Empty()
New_Catagorical_Levels_in_TestData(replacement_strategy='least frequent',\n",
       "                                   target='dummy_target')
Make_Time_Features(list_of_features=None)
Empty()
Empty()
Empty()
Empty()
Empty()
Empty()
Dummify(target='dummy_target')
Clean_Colum_Names()
Empty()
Empty()
" ], "text/plain": [ "Pipeline(memory=None,\n", " steps=[('dtypes',\n", " DataTypes_Auto_infer(categorical_features=[],\n", " display_types=True,\n", " features_todrop=['Country Name'],\n", " ml_usecase='regression',\n", " numerical_features=[],\n", " target='dummy_target',\n", " time_features=[])),\n", " ('imputer',\n", " Simple_Imputer(categorical_strategy='not_available',\n", " numeric_strategy='mean',\n", " target_variable=None)),\n", " ('new_levels1',\n", " New_...\n", " target='dummy_target')),\n", " ('feature_time',\n", " Make_Time_Features(list_of_features=None, time_feature=[])),\n", " ('group', Empty()), ('scaling', Empty()),\n", " ('P_transform', Empty()), ('binn', Empty()),\n", " ('fix_perfect', Empty()), ('rem_outliers', Empty()),\n", " ('dummy', Dummify(target='dummy_target')),\n", " ('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\n", " ('pca', Empty())],\n", " verbose=False)" ] }, "execution_count": 18, "metadata": {}, "output_type": "execute_result" } ], "source": [ "from sklearn import set_config\n", "set_config(display='diagram')\n", "loaded_kmeans[0]" ] }, { "cell_type": "code", "execution_count": 19, "metadata": {}, "outputs": [], "source": [ "from sklearn import set_config\n", "set_config(display='text')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 8. Deploy Model" ] }, { "cell_type": "code", "execution_count": 20, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Model Succesfully Deployed on AWS S3\n" ] } ], "source": [ "deploy_model(kmeans, model_name = 'kmeans-aws', authentication = {'bucket' : 'pycaret-test'})" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 9. Get Config / Set Config" ] }, { "cell_type": "code", "execution_count": 21, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
19951996199719981999200020012002200320042005200620072008200920102011201220132014
02.0048682.0146022.0713092.1777122.3310002.3335962.5887512.5402382.4504152.3149142.1342812.1330382.1668722.1012332.8300672.4896312.5395702.7112622.8954273.073161
12.8015182.8566842.9971572.9894512.7678582.8267522.6799692.8886932.7405932.8459712.6295802.6509002.7906652.8229133.4086513.2640643.0876533.3143033.3184323.260012
24.6785284.7532094.6045744.4999884.6790824.5397114.6662724.9001965.1002494.9136294.9708614.8414504.8090575.0547855.3949215.2843805.0962125.0413175.0292665.017717
32.2031642.1566322.2273112.3641002.4543942.4505552.5270812.3477022.3632632.3468242.3373472.3698842.3852512.4051262.7012602.5071312.4954912.4973402.5867012.665603
44.4290904.2031524.2443514.4539844.6269204.6888494.6847904.6135374.6350984.6266964.5662154.3671464.2973944.4348484.8652414.7758174.8717274.8668694.6432214.571448
\n", "
" ], "text/plain": [ " 1995 1996 1997 1998 1999 2000 2001 \\\n", "0 2.004868 2.014602 2.071309 2.177712 2.331000 2.333596 2.588751 \n", "1 2.801518 2.856684 2.997157 2.989451 2.767858 2.826752 2.679969 \n", "2 4.678528 4.753209 4.604574 4.499988 4.679082 4.539711 4.666272 \n", "3 2.203164 2.156632 2.227311 2.364100 2.454394 2.450555 2.527081 \n", "4 4.429090 4.203152 4.244351 4.453984 4.626920 4.688849 4.684790 \n", "\n", " 2002 2003 2004 2005 2006 2007 2008 \\\n", "0 2.540238 2.450415 2.314914 2.134281 2.133038 2.166872 2.101233 \n", "1 2.888693 2.740593 2.845971 2.629580 2.650900 2.790665 2.822913 \n", "2 4.900196 5.100249 4.913629 4.970861 4.841450 4.809057 5.054785 \n", "3 2.347702 2.363263 2.346824 2.337347 2.369884 2.385251 2.405126 \n", "4 4.613537 4.635098 4.626696 4.566215 4.367146 4.297394 4.434848 \n", "\n", " 2009 2010 2011 2012 2013 2014 \n", "0 2.830067 2.489631 2.539570 2.711262 2.895427 3.073161 \n", "1 3.408651 3.264064 3.087653 3.314303 3.318432 3.260012 \n", "2 5.394921 5.284380 5.096212 5.041317 5.029266 5.017717 \n", "3 2.701260 2.507131 2.495491 2.497340 2.586701 2.665603 \n", "4 4.865241 4.775817 4.871727 4.866869 4.643221 4.571448 " ] }, "execution_count": 21, "metadata": {}, "output_type": "execute_result" } ], "source": [ "X = get_config('X')\n", "X.head()" ] }, { "cell_type": "code", "execution_count": 22, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "123" ] }, "execution_count": 22, "metadata": {}, "output_type": "execute_result" } ], "source": [ "get_config('seed')" ] }, { "cell_type": "code", "execution_count": 23, "metadata": {}, "outputs": [], "source": [ "from pycaret.clustering import set_config\n", "set_config('seed', 999)" ] }, { "cell_type": "code", "execution_count": 24, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "999" ] }, "execution_count": 24, "metadata": {}, "output_type": "execute_result" } ], "source": [ "get_config('seed')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 10. 
Get System Logs" ] }, { "cell_type": "code", "execution_count": 25, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "['2020-07-29 09', '47', '14,652', 'INFO', 'PyCaret Regression Module']\n", "['2020-07-29 09', '47', '14,652', 'INFO', 'version pycaret-nightly-0.39']\n", "['2020-07-29 09', '47', '14,652', 'INFO', 'Initializing setup()']\n", "['2020-07-29 09', '47', '14,652', 'INFO', 'USI', 'e640']\n", "['2020-07-29 09', '47', '14,652', 'INFO', 'setup(data=(1338, 7), target=charges, train_size=0.7, sampling=True, sample_estimator=None, categorical_features=None, categorical_imputation=constant, ordinal_features=None,']\n", "['high_cardinality_features=None, high_cardinality_method=frequency, numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']\n", "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None, remove_outliers=False, outliers_threshold=0.05,']\n", "['remove_multicollinearity=False, multicollinearity_threshold=0.9, remove_perfect_collinearity=False, create_clusters=False, cluster_iter=20,']\n", "['polynomial_features=False, polynomial_degree=2, trigonometry_features=False, polynomial_threshold=0.1, group_features=None,']\n", "['group_names=None, feature_selection=False, feature_selection_threshold=0.8, feature_interaction=False, feature_ratio=False, interaction_threshold=0.01, transform_target=False,']\n", "['transform_target_method=box-cox, data_split_shuffle=True, folds_shuffle=False, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", "['experiment_name=insurance1, log_plots=False, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", "['2020-07-29 09', 
'47', '14,653', 'INFO', 'Checking environment']\n", "['2020-07-29 09', '47', '14,653', 'INFO', 'python_version', '3.6.10']\n", "['2020-07-29 09', '47', '14,653', 'INFO', 'python_build', \"('default', 'May 7 2020 19\", '46', \"08')\"]\n", "['2020-07-29 09', '47', '14,653', 'INFO', 'machine', 'AMD64']\n", "['2020-07-29 09', '47', '14,653', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", "['2020-07-29 09', '47', '14,674', 'INFO', 'Memory', 'svmem(total=17032478720, available=5530103808, percent=67.5, used=11502374912, free=5530103808)']\n", "['2020-07-29 09', '47', '14,674', 'INFO', 'Physical Core', '4']\n", "['2020-07-29 09', '47', '14,674', 'INFO', 'Logical Core', '8']\n", "['2020-07-29 09', '47', '14,674', 'INFO', 'Checking libraries']\n", "['2020-07-29 09', '47', '14,674', 'INFO', 'pd==1.0.4']\n", "['2020-07-29 09', '47', '14,674', 'INFO', 'numpy==1.18.5']\n", "['2020-07-29 09', '47', '15,120', 'INFO', 'sklearn==0.23.1']\n", "['2020-07-29 09', '47', '15,204', 'INFO', 'xgboost==1.1.1']\n", "['2020-07-29 09', '47', '15,259', 'INFO', 'lightgbm==2.3.1']\n", "['2020-07-29 09', '47', '15,310', 'INFO', 'catboost==0.23.2']\n", "['2020-07-29 09', '47', '15,876', 'INFO', 'mlflow==1.8.0']\n", "['2020-07-29 09', '47', '15,877', 'INFO', 'Checking Exceptions']\n", "['2020-07-29 09', '47', '15,877', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '47', '15,877', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '47', '15,900', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '47', '18,284', 'INFO', 'Copying data for preprocessing']\n", "['2020-07-29 09', '47', '18,285', 'INFO', 'Declaring global variables']\n", "['2020-07-29 09', '47', '18,296', 'INFO', 'Declaring preprocessing parameters']\n", "['2020-07-29 09', '47', '18,296', 'INFO', 'Importing preprocessing module']\n", "['2020-07-29 09', '47', '19,149', 'INFO', 'Creating preprocessing pipeline']\n", "['2020-07-29 09', '47', '20,310', 'INFO', 'Preprocessing pipeline created successfully']\n", 
"['2020-07-29 09', '47', '20,310', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '20,310', 'INFO', 'Creating grid variables']\n", "['2020-07-29 09', '47', '20,311', 'INFO', 'Creating global containers']\n", "['2020-07-29 09', '47', '20,410', 'INFO', 'Logging experiment in MLFlow']\n", "['2020-07-29 09', '47', '20,692', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '20,693', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '20,702', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", "['2020-07-29 09', '47', '20,702', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '20,710', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '20,721', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", 
"[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), None]']\n", "['2020-07-29 09', '47', '20,721', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '20,722', 'INFO', 'SubProcess save_model() end 
==================================']\n", "['2020-07-29 09', '47', '20,809', 'INFO', 'create_model_container', '0']\n", "['2020-07-29 09', '47', '20,809', 'INFO', 'master_model_container', '0']\n", "['2020-07-29 09', '47', '20,809', 'INFO', 'display_container', '0']\n", "['2020-07-29 09', '47', '20,809', 'INFO', 'setup() succesfully completed......................................']\n", "['2020-07-29 09', '47', '32,141', 'INFO', 'Initializing compare_models()']\n", "['2020-07-29 09', '47', '32,141', 'INFO', 'compare_models(blacklist=None, whitelist=None, fold=5, round=4, sort=R2, n_select=1, turbo=True, verbose=True)']\n", "['2020-07-29 09', '47', '32,141', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '47', '32,141', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '47', '32,141', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '47', '32,174', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '47', '32,176', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '47', '32,186', 'INFO', 'Importing untrained models']\n", "['2020-07-29 09', '47', '32,187', 'INFO', 'Import successful']\n", "['2020-07-29 09', '47', '32,191', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '47', '32,192', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '47', '32,192', 'INFO', 'Initializing Linear Regression']\n", "['2020-07-29 09', '47', '32,198', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '32,206', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '32,210', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,212', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '32,212', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '32,229', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '32,235', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '32,239', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,240', 'INFO', 'No inverse transformer found']\n", 
"['2020-07-29 09', '47', '32,241', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '32,248', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '32,254', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '32,257', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,259', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '32,260', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '32,266', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '32,271', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '32,275', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,276', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '32,277', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '32,282', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '32,288', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '32,291', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,293', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '32,293', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '32,302', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '32,302', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '32,313', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '32,365', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '32,366', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '32,366', 'INFO', 'save_model(model=LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '47', '32,366', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '32,371', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '32,376', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", 
"['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), None]']\n", "['2020-07-29 09', '47', '32,376', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '32,376', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '32,731', 'INFO', 'Initializing Lasso Regression']\n", "['2020-07-29 09', '47', '32,736', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '32,742', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '32,747', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,749', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '32,749', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '32,756', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '32,762', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '32,766', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,768', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '32,768', 'INFO', 
'Compiling Metrics']\n", "['2020-07-29 09', '47', '32,775', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '32,781', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '32,786', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,788', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '32,788', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '32,795', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '32,801', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '32,804', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,805', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '32,805', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '32,812', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '32,818', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '32,820', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,822', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '32,822', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '32,829', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '32,829', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '32,841', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '32,901', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '32,901', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '32,901', 'INFO', 'save_model(model=Lasso(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=1000,']\n", "['normalize=False, positive=False, precompute=False, random_state=123,']\n", "[\"selection='cyclic', tol=0.0001, warm_start=False), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '47', '32,901', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '32,907', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', 
'47', '32,912', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), Lasso(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=1000,']\n", "['normalize=False, positive=False, precompute=False, random_state=123,']\n", "[\"selection='cyclic', tol=0.0001, warm_start=False), None]\"]\n", "['2020-07-29 09', '47', '32,912', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '32,912', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '32,961', 'INFO', 'Initializing Ridge Regression']\n", "['2020-07-29 09', '47', '32,967', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '32,972', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '32,974', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,976', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '32,976', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '32,983', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '32,988', 'INFO', 
'Fitting Model']\n", "['2020-07-29 09', '47', '32,991', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '32,993', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '32,993', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,001', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '33,006', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,008', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,010', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,010', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,017', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '33,022', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,025', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,027', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,027', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,035', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '33,041', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,043', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,045', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,045', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,051', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '33,051', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '33,062', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '33,129', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '33,129', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '33,129', 'INFO', 'save_model(model=Ridge(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=None,']\n", "[\"normalize=False, random_state=123, solver='auto', tol=0.001), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '47', '33,129', 'INFO', 
'Appending prep pipeline']\n", "['2020-07-29 09', '47', '33,134', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '33,139', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), Ridge(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=None,']\n", "[\"normalize=False, random_state=123, solver='auto', tol=0.001), None]\"]\n", "['2020-07-29 09', '47', '33,139', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '33,139', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '33,188', 'INFO', 'Initializing Elastic Net']\n", "['2020-07-29 09', '47', '33,194', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '33,200', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,203', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,205', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,205', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,212', 
'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '33,219', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,222', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,225', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,225', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,232', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '33,237', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,241', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,243', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,243', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,251', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '33,255', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,260', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,262', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,262', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,270', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '33,277', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,280', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,283', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,283', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,291', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '33,291', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '33,302', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '33,367', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '33,368', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '33,368', 'INFO', 'save_model(model=ElasticNet(alpha=1.0, copy_X=True, fit_intercept=True, l1_ratio=0.5,']\n", "['max_iter=1000, normalize=False, positive=False, precompute=False,']\n", 
"[\"random_state=123, selection='cyclic', tol=0.0001, warm_start=False), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '47', '33,368', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '33,373', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '33,379', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), ElasticNet(alpha=1.0, copy_X=True, fit_intercept=True, l1_ratio=0.5,']\n", "['max_iter=1000, normalize=False, positive=False, precompute=False,']\n", "[\"random_state=123, selection='cyclic', tol=0.0001, warm_start=False), None]\"]\n", "['2020-07-29 09', '47', '33,379', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '33,379', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '33,465', 'INFO', 'Initializing Least Angle Regression']\n", "['2020-07-29 09', '47', '33,470', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '33,476', 'INFO', 'Fitting 
Model']\n", "['2020-07-29 09', '47', '33,482', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,483', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,484', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,490', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '33,496', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,502', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,504', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,504', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,510', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '33,517', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,522', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,523', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,523', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,531', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '33,536', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,542', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,543', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,544', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,552', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '33,564', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,572', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,574', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,574', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,580', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '33,581', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '33,593', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '33,653', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', 
'33,654', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '33,654', 'INFO', 'save_model(model=Lars(copy_X=True, eps=2.220446049250313e-16, fit_intercept=True, fit_path=True,']\n", "[\"jitter=None, n_nonzero_coefs=500, normalize=True, precompute='auto',\"]\n", "['random_state=None, verbose=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '47', '33,654', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '33,658', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '33,664', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), Lars(copy_X=True, eps=2.220446049250313e-16, fit_intercept=True, fit_path=True,']\n", "[\"jitter=None, n_nonzero_coefs=500, normalize=True, precompute='auto',\"]\n", "['random_state=None, verbose=False), None]']\n", "['2020-07-29 09', '47', '33,664', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '33,664', 'INFO', 'SubProcess save_model() end 
==================================']\n", "['2020-07-29 09', '47', '33,714', 'INFO', 'Initializing Lasso Least Angle Regression']\n", "['2020-07-29 09', '47', '33,720', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '33,728', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,733', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,734', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,734', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,739', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '33,745', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,750', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,752', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,752', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,758', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '33,764', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,768', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,770', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,770', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,775', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '33,780', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,784', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,786', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,786', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,792', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '33,798', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,802', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,803', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,803', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,809', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '33,810', 
'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '33,821', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '33,878', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '33,878', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '33,878', 'INFO', 'save_model(model=LassoLars(alpha=1.0, copy_X=True, eps=2.220446049250313e-16, fit_intercept=True,']\n", "['fit_path=True, jitter=None, max_iter=500, normalize=True,']\n", "[\"positive=False, precompute='auto', random_state=None, verbose=False), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '47', '33,878', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '33,884', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '33,889', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), LassoLars(alpha=1.0, copy_X=True, eps=2.220446049250313e-16, fit_intercept=True,']\n", "['fit_path=True, jitter=None, max_iter=500, normalize=True,']\n", 
"[\"positive=False, precompute='auto', random_state=None, verbose=False), None]\"]\n", "['2020-07-29 09', '47', '33,889', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '33,890', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '33,946', 'INFO', 'Initializing Orthogonal Matching Pursuit']\n", "['2020-07-29 09', '47', '33,952', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '33,961', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,964', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,966', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,966', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,974', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '33,983', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '33,985', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '33,987', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '33,988', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '33,997', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '34,002', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '34,006', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,008', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,008', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,017', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '34,023', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '34,026', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,029', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,029', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,037', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '34,044', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '34,048', 'INFO', 
'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,051', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,051', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,058', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '34,058', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '34,073', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '34,193', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '34,193', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '34,194', 'INFO', 'save_model(model=OrthogonalMatchingPursuit(fit_intercept=True, n_nonzero_coefs=None,']\n", "[\"normalize=True, precompute='auto', tol=None), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '47', '34,194', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '34,202', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '34,211', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", 
"['verbose=False), OrthogonalMatchingPursuit(fit_intercept=True, n_nonzero_coefs=None,']\n", "[\"normalize=True, precompute='auto', tol=None), None]\"]\n", "['2020-07-29 09', '47', '34,211', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '34,211', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '34,263', 'INFO', 'Initializing Bayesian Ridge']\n", "['2020-07-29 09', '47', '34,269', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '34,277', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '34,284', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,286', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,287', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,295', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '34,304', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '34,311', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,314', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,314', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,323', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '34,331', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '34,339', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,341', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,342', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,350', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '34,357', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '34,364', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,367', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,367', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,375', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '34,383', 'INFO', 'Fitting 
Model']\n", "['2020-07-29 09', '47', '34,391', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,393', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,393', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,402', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '34,402', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '34,420', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '34,507', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '34,507', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '34,508', 'INFO', 'save_model(model=BayesianRidge(alpha_1=1e-06, alpha_2=1e-06, alpha_init=None,']\n", "['compute_score=False, copy_X=True, fit_intercept=True,']\n", "['lambda_1=1e-06, lambda_2=1e-06, lambda_init=None, n_iter=300,']\n", "['normalize=False, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '47', '34,508', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '34,516', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '34,523', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", 
"[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), BayesianRidge(alpha_1=1e-06, alpha_2=1e-06, alpha_init=None,']\n", "['compute_score=False, copy_X=True, fit_intercept=True,']\n", "['lambda_1=1e-06, lambda_2=1e-06, lambda_init=None, n_iter=300,']\n", "['normalize=False, tol=0.001, verbose=False), None]']\n", "['2020-07-29 09', '47', '34,524', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '34,524', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '34,625', 'INFO', 'Initializing Passive Aggressive Regressor']\n", "['2020-07-29 09', '47', '34,633', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '34,640', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '34,651', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,654', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,654', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,664', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '34,672', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '34,683', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,685', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,686', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,696', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '34,705', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '34,715', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,717', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,717', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,726', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '34,735', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', 
'47', '34,746', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,749', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,749', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,759', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '34,767', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '34,777', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '34,779', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '34,779', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '34,790', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '34,790', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '34,808', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '34,904', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '34,904', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '34,905', 'INFO', 'save_model(model=PassiveAggressiveRegressor(C=1.0, average=False, early_stopping=False,']\n", "['epsilon=0.1, fit_intercept=True,']\n", "[\"loss='epsilon_insensitive', max_iter=1000,\"]\n", "['n_iter_no_change=5, random_state=123, shuffle=True,']\n", "['tol=0.001, validation_fraction=0.1, verbose=0,']\n", "['warm_start=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '47', '34,905', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '34,914', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '34,922', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", 
"[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), PassiveAggressiveRegressor(C=1.0, average=False, early_stopping=False,']\n", "['epsilon=0.1, fit_intercept=True,']\n", "[\"loss='epsilon_insensitive', max_iter=1000,\"]\n", "['n_iter_no_change=5, random_state=123, shuffle=True,']\n", "['tol=0.001, validation_fraction=0.1, verbose=0,']\n", "['warm_start=False), None]']\n", "['2020-07-29 09', '47', '34,922', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '34,922', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '35,002', 'INFO', 'Initializing Random Sample Consensus']\n", "['2020-07-29 09', '47', '35,011', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '35,023', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '35,179', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '35,182', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '35,183', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '35,194', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '35,203', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '35,358', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '35,361', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '35,361', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '35,371', 'INFO', 
'Initializing Fold 3']\n", "['2020-07-29 09', '47', '35,381', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '35,533', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '35,535', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '35,535', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '35,547', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '35,556', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '35,711', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '35,714', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '35,715', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '35,727', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '35,737', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '35,875', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '35,878', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '35,878', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '35,889', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '35,889', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '35,911', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '36,020', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '36,020', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '36,020', 'INFO', 'save_model(model=RANSACRegressor(base_estimator=None, is_data_valid=None, is_model_valid=None,']\n", "[\"loss='absolute_loss', max_skips=inf, max_trials=100,\"]\n", "['min_samples=0.5, random_state=123, residual_threshold=None,']\n", "['stop_n_inliers=inf, stop_probability=0.99, stop_score=inf), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '47', '36,020', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '36,029', 'INFO', 'Trained Model.pkl saved in current working directory']\n", 
"['2020-07-29 09', '47', '36,039', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), RANSACRegressor(base_estimator=None, is_data_valid=None, is_model_valid=None,']\n", "[\"loss='absolute_loss', max_skips=inf, max_trials=100,\"]\n", "['min_samples=0.5, random_state=123, residual_threshold=None,']\n", "['stop_n_inliers=inf, stop_probability=0.99, stop_score=inf), None]']\n", "['2020-07-29 09', '47', '36,039', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '36,039', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '36,159', 'INFO', 'Initializing TheilSen Regressor']\n", "['2020-07-29 09', '47', '36,168', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '36,178', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '42,054', 'INFO', 'PyCaret Clustering Module']\n", "['2020-07-29 09', '47', '42,054', 'INFO', 'version pycaret-nightly-0.39']\n", "['2020-07-29 09', '47', '42,055', 'INFO', 'Initializing setup()']\n", "['2020-07-29 
09', '47', '42,055', 'INFO', 'USI', 'e74c']\n", "['2020-07-29 09', '47', '42,056', 'INFO', 'setup(data=(224, 21), categorical_features=None, categorical_imputation=constant, ordinal_features=None, high_cardinality_features=None,']\n", "[\"numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=['Country Name'], normalize=False,\"]\n", "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None,']\n", "['remove_multicollinearity=False, multicollinearity_threshold=0.9, group_features=None,']\n", "['group_names=None, supervised=False, supervised_target=None, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", "['experiment_name=health1, log_plots=True, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", "['2020-07-29 09', '47', '42,057', 'INFO', 'Checking environment']\n", "['2020-07-29 09', '47', '42,058', 'INFO', 'python_version', '3.6.10']\n", "['2020-07-29 09', '47', '42,058', 'INFO', 'python_build', \"('default', 'May 7 2020 19\", '46', \"08')\"]\n", "['2020-07-29 09', '47', '42,059', 'INFO', 'machine', 'AMD64']\n", "['2020-07-29 09', '47', '42,060', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", "['2020-07-29 09', '47', '42,272', 'INFO', 'Memory', 'svmem(total=17032478720, available=5177511936, percent=69.6, used=11854966784, free=5177511936)']\n", "['2020-07-29 09', '47', '42,272', 'INFO', 'Physical Core', '4']\n", "['2020-07-29 09', '47', '42,273', 'INFO', 'Logical Core', '8']\n", "['2020-07-29 09', '47', '42,273', 'INFO', 'Checking libraries']\n", "['2020-07-29 09', '47', '42,273', 'INFO', 'pd==1.0.4']\n", "['2020-07-29 09', '47', '42,283', 'INFO', 'numpy==1.18.5']\n", "['2020-07-29 09', '47', '43,243', 'INFO', 
'Evaluating Metrics']\n", "['2020-07-29 09', '47', '43,252', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '43,252', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '43,276', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '43,295', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '43,989', 'INFO', 'sklearn==0.23.1']\n", "['2020-07-29 09', '47', '43,991', 'INFO', 'kmodes==0.10.2']\n", "['2020-07-29 09', '47', '45,076', 'INFO', 'PyCaret Anomaly Detection Module']\n", "['2020-07-29 09', '47', '45,076', 'INFO', 'version pycaret-nightly-0.39']\n", "['2020-07-29 09', '47', '45,076', 'INFO', 'Initializing setup()']\n", "['2020-07-29 09', '47', '45,076', 'INFO', 'USI', '9b51']\n", "['2020-07-29 09', '47', '45,077', 'INFO', 'setup(data=(1000, 10), categorical_features=None, categorical_imputation=constant, ordinal_features=None, high_cardinality_features=None,']\n", "['numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']\n", "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None,']\n", "['remove_multicollinearity=False, multicollinearity_threshold=0.9, group_features=None,']\n", "['group_names=None, supervised=False, supervised_target=None, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", "['experiment_name=anomaly1, log_plots=False, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", "['2020-07-29 09', '47', '45,077', 'INFO', 'Checking environment']\n", "['2020-07-29 09', '47', '45,078', 'INFO', 'python_version', '3.6.10']\n", "['2020-07-29 09', '47', '45,078', 'INFO', 'python_build', \"('default', 'May 7 2020 19\", '46', \"08')\"]\n", "['2020-07-29 09', 
'47', '45,078', 'INFO', 'machine', 'AMD64']\n", "['2020-07-29 09', '47', '45,079', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", "['2020-07-29 09', '47', '45,083', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '45,089', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '45,090', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '45,113', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '45,133', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '45,136', 'INFO', 'Memory', 'svmem(total=17032478720, available=5155127296, percent=69.7, used=11877351424, free=5155127296)']\n", "['2020-07-29 09', '47', '45,137', 'INFO', 'Physical Core', '4']\n", "['2020-07-29 09', '47', '45,137', 'INFO', 'Logical Core', '8']\n", "['2020-07-29 09', '47', '45,137', 'INFO', 'Checking libraries']\n", "['2020-07-29 09', '47', '45,137', 'INFO', 'pd==1.0.4']\n", "['2020-07-29 09', '47', '45,138', 'INFO', 'numpy==1.18.5']\n", "['2020-07-29 09', '47', '45,767', 'INFO', 'mlflow==1.8.0']\n", "['2020-07-29 09', '47', '45,768', 'INFO', 'Checking Exceptions']\n", "['2020-07-29 09', '47', '45,769', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '47', '45,850', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '47', '45,903', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '47', '45,903', 'INFO', 'Declaring global variables']\n", "['2020-07-29 09', '47', '45,904', 'INFO', 'Copying data for preprocessing']\n", "['2020-07-29 09', '47', '45,920', 'INFO', 'Declaring preprocessing parameters']\n", "['2020-07-29 09', '47', '45,921', 'INFO', 'Importing preprocessing module']\n", "['2020-07-29 09', '47', '47,044', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '47,054', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '47,055', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '47,083', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '47,108', 'INFO', 'Fitting Model']\n", 
"['2020-07-29 09', '47', '48,011', 'WARNING', 'pyod not found']\n", "['2020-07-29 09', '47', '48,500', 'INFO', 'Creating preprocessing pipeline']\n", "['2020-07-29 09', '47', '49,140', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '49,146', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '49,146', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '49,170', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '49,194', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '49,891', 'INFO', 'Preprocessing pipeline created successfully']\n", "['2020-07-29 09', '47', '49,892', 'INFO', 'Creating grid variables']\n", "['2020-07-29 09', '47', '49,896', 'INFO', 'Creating global containers']\n", "['2020-07-29 09', '47', '49,930', 'INFO', 'mlflow==1.8.0']\n", "['2020-07-29 09', '47', '49,931', 'INFO', 'Checking Exceptions']\n", "['2020-07-29 09', '47', '49,931', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '47', '50,035', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '47', '50,094', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '47', '50,094', 'INFO', 'Declaring global variables']\n", "['2020-07-29 09', '47', '50,094', 'INFO', 'Copying data for preprocessing']\n", "['2020-07-29 09', '47', '50,112', 'INFO', 'Declaring preprocessing parameters']\n", "['2020-07-29 09', '47', '50,112', 'INFO', 'Importing preprocessing module']\n", "['2020-07-29 09', '47', '51,064', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '51,070', 'INFO', 'Logging experiment in MLFlow']\n", "['2020-07-29 09', '47', '51,071', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '51,071', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '51,100', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '51,101', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '51,167', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '51,238', 'INFO', 'Creating 
preprocessing pipeline']\n", "['2020-07-29 09', '47', '51,321', 'INFO', 'PyCaret NLP Module']\n", "['2020-07-29 09', '47', '51,321', 'INFO', 'version pycaret-nightly-0.39']\n", "['2020-07-29 09', '47', '51,322', 'INFO', 'Initializing setup()']\n", "['2020-07-29 09', '47', '51,322', 'INFO', 'USI', 'ab65']\n", "['2020-07-29 09', '47', '51,322', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=True, session_id=123, log_experiment=True,']\n", "['experiment_name=kiva1, log_plots=True, log_data=False, verbose=True)']\n", "['2020-07-29 09', '47', '51,323', 'INFO', 'Checking environment']\n", "['2020-07-29 09', '47', '51,323', 'INFO', 'python_version', '3.6.10']\n", "['2020-07-29 09', '47', '51,323', 'INFO', 'python_build', \"('default', 'May 7 2020 19\", '46', \"08')\"]\n", "['2020-07-29 09', '47', '51,323', 'INFO', 'machine', 'AMD64']\n", "['2020-07-29 09', '47', '51,324', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", "['2020-07-29 09', '47', '51,402', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '51,402', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '51,404', 'INFO', 'save_model(model=TheilSenRegressor(copy_X=True, fit_intercept=True, max_iter=300,']\n", "['max_subpopulation=10000, n_jobs=-1, n_subsamples=None,']\n", "['random_state=123, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '47', '51,404', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '51,411', 'INFO', 'Memory', 'svmem(total=17032478720, available=5093425152, percent=70.1, used=11939053568, free=5093425152)']\n", "['2020-07-29 09', '47', '51,412', 'INFO', 'Physical Core', '4']\n", "['2020-07-29 09', '47', '51,412', 'INFO', 'Logical Core', '8']\n", "['2020-07-29 09', '47', '51,412', 'INFO', 'Checking libraries']\n", "['2020-07-29 09', '47', '51,412', 'INFO', 'pd==1.0.4']\n", "['2020-07-29 09', '47', '51,413', 'INFO', 'numpy==1.18.5']\n", 
"['2020-07-29 09', '47', '51,431', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '51,463', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), TheilSenRegressor(copy_X=True, fit_intercept=True, max_iter=300,']\n", "['max_subpopulation=10000, n_jobs=-1, n_subsamples=None,']\n", "['random_state=123, tol=0.001, verbose=False), None]']\n", "['2020-07-29 09', '47', '51,463', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '51,463', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '51,703', 'INFO', 'Initializing Huber Regressor']\n", "['2020-07-29 09', '47', '51,722', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '51,746', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '51,869', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '51,870', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '51,897', 'INFO', 
'save_model(model=Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", "['2020-07-29 09', '47', '51,897', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '51,912', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '51,922', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '51,926', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '51,926', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '51,942', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", 
"[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False), Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False)]']\n", "['2020-07-29 09', '47', '51,942', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '51,943', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '51,951', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '51,969', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '52,110', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', 
'52,118', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '52,118', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '52,131', 'INFO', 'Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False)']\n", "['2020-07-29 09', '47', '52,132', 'INFO', 'setup() succesfully completed......................................']\n", "['2020-07-29 09', '47', '52,142', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '52,165', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '52,296', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '52,301', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '52,302', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '52,321', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '52,340', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '52,469', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '52,473', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '52,473', 'INFO', 'Compiling Metrics']\n", 
"['2020-07-29 09', '47', '52,491', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '52,507', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '52,632', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '52,638', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '52,638', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '52,653', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '52,654', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '52,688', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '52,825', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '52,825', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '52,826', 'INFO', 'save_model(model=HuberRegressor(alpha=0.0001, epsilon=1.35, fit_intercept=True, max_iter=100,']\n", "['tol=1e-05, warm_start=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '47', '52,826', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '52,841', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '52,854', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', 
Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), HuberRegressor(alpha=0.0001, epsilon=1.35, fit_intercept=True, max_iter=100,']\n", "['tol=1e-05, warm_start=False), None]']\n", "['2020-07-29 09', '47', '52,854', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '52,854', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '53,009', 'INFO', 'Initializing Support Vector Machine']\n", "['2020-07-29 09', '47', '53,023', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '53,040', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '53,106', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '53,120', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '53,120', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '53,135', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '53,149', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '53,211', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '53,223', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '53,223', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '53,237', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '53,250', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '53,304', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '53,313', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '53,314', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '53,326', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '53,341', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '53,367', 'INFO', 'gensim==3.8.3']\n", "['2020-07-29 09', '47', '53,398', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '53,410', 'INFO', 'No 
inverse transformer found']\n", "['2020-07-29 09', '47', '53,410', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '53,424', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '53,436', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '53,489', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '53,500', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '53,500', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '53,513', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '53,513', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '53,544', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '53,668', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '53,668', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '53,669', 'INFO', \"save_model(model=SVR(C=1.0, cache_size=200, coef0=0.0, degree=3, epsilon=0.1, gamma='scale',\"]\n", "[\"kernel='rbf', max_iter=-1, shrinking=True, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '47', '53,669', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '53,680', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '53,690', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', 
Empty()), ('rem_outliers', Empty()),\"]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), SVR(C=1.0, cache_size=200, coef0=0.0, degree=3, epsilon=0.1, gamma='scale',\"]\n", "[\"kernel='rbf', max_iter=-1, shrinking=True, tol=0.001, verbose=False), None]\"]\n", "['2020-07-29 09', '47', '53,690', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '53,690', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '53,805', 'INFO', 'Initializing K Neighbors Regressor']\n", "['2020-07-29 09', '47', '53,817', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '53,831', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '53,838', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '53,953', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '53,953', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '53,968', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '53,981', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '53,989', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '54,057', 'INFO', 'spacy==2.2.4']\n", "['2020-07-29 09', '47', '54,099', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '54,100', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '54,115', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '54,126', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '54,134', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '54,243', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '54,243', 'INFO', 'Compiling Metrics']\n", 
"['2020-07-29 09', '47', '54,256', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '54,266', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '54,275', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '54,384', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '54,384', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '54,395', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '54,405', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '54,414', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '54,524', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '54,525', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '54,538', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '54,539', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '54,572', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '54,705', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '54,705', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '54,706', 'INFO', \"save_model(model=KNeighborsRegressor(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", "[\"weights='uniform'), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '47', '54,707', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '54,723', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '54,740', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", 
"[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), KNeighborsRegressor(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", "[\"weights='uniform'), None]\"]\n", "['2020-07-29 09', '47', '54,740', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '54,740', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '54,857', 'INFO', 'nltk==3.5']\n", "['2020-07-29 09', '47', '54,892', 'INFO', 'Initializing Decision Tree']\n", "['2020-07-29 09', '47', '54,902', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '54,921', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '54,924', 'INFO', 'textblob==0.15.3']\n", "['2020-07-29 09', '47', '54,932', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '54,935', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '54,935', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '54,949', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '54,965', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '54,978', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '54,983', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '54,984', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '55,005', 'INFO', 'Initializing Fold 3']\n", 
"['2020-07-29 09', '47', '55,021', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '55,032', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '55,036', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '47', '55,036', 'INFO', 'create_model(model=kmeans, num_clusters=4, ground_truth=None, verbose=True, system=True)']\n", "['2020-07-29 09', '47', '55,036', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '47', '55,037', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '47', '55,037', 'INFO', 'Setting num_cluster param']\n", "['2020-07-29 09', '47', '55,037', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '47', '55,038', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '55,038', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '55,057', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '55,077', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '55,078', 'INFO', 'Importing untrained model']\n", "['2020-07-29 09', '47', '55,078', 'INFO', 'K-Means Clustering Imported succesfully']\n", "['2020-07-29 09', '47', '55,094', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '55,098', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '55,102', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '55,102', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '55,122', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '55,141', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '55,158', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '55,163', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '55,163', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '55,189', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '55,190', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '55,214', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '55,232', 'INFO', 'Creating 
MLFlow logs']\n", "['2020-07-29 09', '47', '55,236', 'INFO', 'Creating Metrics dataframe']\n", "['2020-07-29 09', '47', '55,245', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '55,417', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '55,417', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '55,419', 'INFO', \"save_model(model=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", "['max_features=None, max_leaf_nodes=None,']\n", "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", "['min_samples_leaf=1, min_samples_split=2,']\n", "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '47', '55,419', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '55,437', 'INFO', 'SubProcess plot_model() called ==================================']\n", "['2020-07-29 09', '47', '55,437', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '47', '55,438', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '47', '55,439', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '55,439', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '47', '55,439', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '47', '55,465', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", 
"[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", "['max_features=None, max_leaf_nodes=None,']\n", "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", "['min_samples_leaf=1, min_samples_split=2,']\n", "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", "[\"random_state=123, splitter='best'), None]\"]\n", "['2020-07-29 09', '47', '55,466', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '55,466', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '55,656', 'INFO', 'Initializing Random Forest']\n", "['2020-07-29 09', '47', '55,675', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '47', '55,694', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '56,059', 'INFO', 'pyLDAvis==2.1.2']\n", "['2020-07-29 09', '47', '56,271', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '56,275', 'INFO', 'wordcloud==1.7.0']\n", "['2020-07-29 09', '47', '56,383', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '56,384', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '56,401', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '47', '56,417', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', 
'47', '56,825', 'INFO', 'Preprocessing pipeline created successfully']\n", "['2020-07-29 09', '47', '56,826', 'INFO', 'Creating grid variables']\n", "['2020-07-29 09', '47', '56,829', 'INFO', 'Creating global containers']\n", "['2020-07-29 09', '47', '56,945', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '57,059', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '57,060', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '57,086', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '47', '57,104', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '57,516', 'INFO', 'mlflow==1.8.0']\n", "['2020-07-29 09', '47', '57,516', 'INFO', 'Checking Exceptions']\n", "['2020-07-29 09', '47', '57,718', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '57,739', 'INFO', 'Logging experiment in MLFlow']\n", "['2020-07-29 09', '47', '57,833', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '57,834', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '57,859', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '47', '57,881', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '58,479', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '58,479', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '58,508', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_L...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", 
"['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", "['2020-07-29 09', '47', '58,508', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '58,521', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '58,552', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_L...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False), Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", 
"[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_L...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False)]']\n", "['2020-07-29 09', '47', '58,552', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '58,552', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '58,578', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '58,692', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '58,693', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '58,708', 'INFO', 'Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_L...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', 
Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False)']\n", "['2020-07-29 09', '47', '58,708', 'INFO', 'setup() succesfully completed......................................']\n", "['2020-07-29 09', '47', '58,714', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '47', '58,735', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '47', '59,302', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '47', '59,421', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '47', '59,422', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '47', '59,443', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '47', '59,444', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '47', '59,489', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '47', '59,672', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '47', '59,672', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '47', '59,674', 'INFO', \"save_model(model=RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", "['max_samples=None, min_impurity_decrease=0.0,']\n", "['min_impurity_split=None, min_samples_leaf=1,']\n", "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '47', '59,674', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '47', '59,703', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '47', '59,789', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '47', '59,796', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '47', '59,811', 'INFO', 'plot type', 
'cluster']\n", "['2020-07-29 09', '47', '59,812', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '47', '59,812', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '47', '59,812', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", "['max_samples=None, min_impurity_decrease=0.0,']\n", "['min_impurity_split=None, min_samples_leaf=1,']\n", "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", "['random_state=123, verbose=0, warm_start=False), None]']\n", "['2020-07-29 09', '47', '59,812', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '59,812', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '47', '59,812', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, 
init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", "['2020-07-29 09', '47', '59,812', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '47', '59,813', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '47', '59,813', 'INFO', 'Copying data']\n", "['2020-07-29 09', '47', '59,813', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", "['2020-07-29 09', '47', '59,814', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '47', '59,849', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '47', '59,850', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '47', '59,850', 'INFO', '(224, 21)']\n", "['2020-07-29 09', '47', '59,851', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '47', '59,851', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '47', '59,858', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '47', '59,859', 'INFO', 'Declaring global variables']\n", "['2020-07-29 09', '47', '59,860', 'INFO', 'Input provided', 'dataframe']\n", "['2020-07-29 09', '47', '59,860', 'INFO', 'session_id set to', '123']\n", "['2020-07-29 09', '47', '59,860', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '47', '59,864', 'INFO', 'Importing stopwords from nltk']\n", "['2020-07-29 09', '47', '59,876', 'INFO', 'Fitting PCA()']\n", "['2020-07-29 09', '47', '59,891', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '47', '59,897', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '47', '59,977', 'INFO', 'Initializing Extra Trees Regressor']\n", "['2020-07-29 09', '47', '59,992', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '48', '00,014', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '00,280', 
'INFO', 'No custom stopwords defined']\n", "['2020-07-29 09', '48', '00,282', 'INFO', 'Removing numeric characters from the text']\n", "['2020-07-29 09', '48', '00,441', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '48', '00,553', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '48', '00,554', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '48', '00,576', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '48', '00,594', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '00,820', 'INFO', 'Removing special characters from the text']\n", "['2020-07-29 09', '48', '01,075', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '48', '01,191', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '48', '01,192', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '48', '01,219', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '48', '01,241', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '01,696', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '48', '01,807', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '48', '01,807', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '48', '01,823', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '48', '01,836', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '02,159', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '48', '02,269', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '48', '02,270', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '48', '02,285', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '48', '02,305', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '02,353', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '48', '02,353', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '02,353', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '48', '02,354', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '02,421', 'INFO', 'Importing untrained model']\n", 
"['2020-07-29 09', '48', '02,422', 'INFO', 'Isolation Forest Imported succesfully']\n", "['2020-07-29 09', '48', '02,449', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '02,813', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '48', '02,928', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '48', '02,929', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '48', '02,953', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '48', '02,954', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '48', '03,011', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '48', '03,241', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '48', '03,242', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '48', '03,244', 'INFO', \"save_model(model=ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", "['max_samples=None, min_impurity_decrease=0.0,']\n", "['min_impurity_split=None, min_samples_leaf=1,']\n", "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '48', '03,244', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '48', '03,413', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '48', '03,441', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", 
"['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", "['max_samples=None, min_impurity_decrease=0.0,']\n", "['min_impurity_split=None, min_samples_leaf=1,']\n", "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", "['random_state=123, verbose=0, warm_start=False), None]']\n", "['2020-07-29 09', '48', '03,441', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '03,442', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '48', '03,744', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '48', '03,753', 'INFO', 'Initializing AdaBoost Regressor']\n", "['2020-07-29 09', '48', '03,780', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '48', '03,810', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '03,946', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '48', '03,960', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '48', '03,961', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '48', '03,961', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '48', '03,961', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '48', '03,962', 'INFO', \"save_model(model=IForest(behaviour='new', bootstrap=False, 
contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '48', '03,962', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '48', '03,999', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '48', '04,028', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '04,118', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '48', '04,126', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '48', '04,127', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '48', '04,146', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '48', '04,165', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '04,169', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '48', '04,188', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_L...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "[\"verbose=False), IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', 
n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0)]']\n", "['2020-07-29 09', '48', '04,188', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '04,189', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '48', '04,228', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '48', '04,238', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '48', '04,238', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '48', '04,265', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '48', '04,290', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '04,301', 'INFO', \"IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0)']\n", "['2020-07-29 09', '48', '04,301', 'INFO', 'create_models() succesfully completed......................................']\n", "['2020-07-29 09', '48', '04,317', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '48', '04,318', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '04,318', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '48', '04,318', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '04,350', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '48', '04,360', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '48', '04,360', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '48', '04,389', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '48', '04,395', 'INFO', 'Importing untrained model']\n", "['2020-07-29 09', '48', '04,396', 'INFO', 'k-Nearest Neighbors Detector Imported succesfully']\n", "['2020-07-29 09', '48', '04,412', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '04,415', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '04,484', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '48', 
'04,484', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '48', '04,494', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '48', '04,494', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '48', '04,518', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '48', '04,519', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '48', '04,583', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '48', '04,697', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '48', '04,698', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '48', '04,699', 'INFO', \"save_model(model=KNN(algorithm='auto', contamination=0.1, leaf_size=30, method='largest',\"]\n", "[\"metric='minkowski', metric_params=None, n_jobs=1, n_neighbors=5, p=2,\"]\n", "['radius=1.0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '48', '04,700', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '48', '04,725', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '48', '04,747', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_L...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', 
Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "[\"verbose=False), KNN(algorithm='auto', contamination=0.1, leaf_size=30, method='largest',\"]\n", "[\"metric='minkowski', metric_params=None, n_jobs=1, n_neighbors=5, p=2,\"]\n", "['radius=1.0)]']\n", "['2020-07-29 09', '48', '04,747', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '04,748', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '48', '04,794', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '48', '04,794', 'INFO', 'Initializing save_model()']\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "['2020-07-29 09', '48', '04,795', 'INFO', \"save_model(model=AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '48', '04,796', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '48', '04,831', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '48', '04,855', 'INFO', \"KNN(algorithm='auto', contamination=0.1, leaf_size=30, method='largest',\"]\n", "[\"metric='minkowski', metric_params=None, n_jobs=1, n_neighbors=5, p=2,\"]\n", "['radius=1.0)']\n", "['2020-07-29 09', '48', '04,855', 'INFO', 'create_models() succesfully completed......................................']\n", "['2020-07-29 09', '48', '04,856', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", 
"['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", "['n_estimators=50, random_state=123), None]']\n", "['2020-07-29 09', '48', '04,856', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '04,856', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '48', '04,871', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '48', '04,873', 'INFO', \"assign_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0), transformation=False, score=True, verbose=True)']\n", "['2020-07-29 09', '48', '04,873', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '48', '04,874', 'INFO', 'Copying data']\n", "['2020-07-29 09', '48', '04,876', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '04,952', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '48', '04,953', 'INFO', 'Trained Model', 'Assigned Isolation Forest']\n", "['2020-07-29 09', '48', '04,956', 'INFO', '(1000, 12)']\n", "['2020-07-29 09', '48', '04,957', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '05,009', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '48', '05,010', 'INFO', 
\"plot_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0), plot=tsne, feature=None, save=False, system=True)']\n", "['2020-07-29 09', '48', '05,011', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '05,011', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '48', '05,796', 'INFO', 'Tokenizing Words']\n", "['2020-07-29 09', '48', '06,772', 'INFO', \"Saving 'Cluster.html' in current active directory\"]\n", "['2020-07-29 09', '48', '06,773', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '48', '06,773', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '07,650', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '48', '07,651', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=distribution, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '48', '07,652', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '07,652', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '48', '07,672', 'INFO', 'plot type', 'distribution']\n", "['2020-07-29 09', '48', '07,672', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '48', '07,672', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '48', '07,674', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=False, verbose=False)']\n", "['2020-07-29 09', '48', '07,674', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', 
'48', '07,675', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '48', '07,675', 'INFO', 'Copying data']\n", "['2020-07-29 09', '48', '07,676', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '07,711', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '48', '07,713', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '48', '07,714', 'INFO', '(224, 22)']\n", "['2020-07-29 09', '48', '07,714', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '07,715', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '48', '07,715', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '48', '07,732', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '48', '08,329', 'INFO', \"Saving 'Distribution.html' in current active directory\"]\n", "['2020-07-29 09', '48', '08,329', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '48', '08,329', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '08,812', 'INFO', 'plot type', 'tsne']\n", "['2020-07-29 09', '48', '08,813', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '48', '08,813', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '48', '08,814', 'INFO', \"assign_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0), transformation=True, score=False, verbose=False)']\n", "['2020-07-29 09', '48', '08,814', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '48', '08,815', 'INFO', 'Copying data']\n", "['2020-07-29 09', '48', '08,815', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '08,849', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '48', '08,850', 'INFO', 'Trained 
Model', 'Assigned Isolation Forest']\n", "['2020-07-29 09', '48', '08,851', 'INFO', '(1000, 11)']\n", "['2020-07-29 09', '48', '08,851', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '08,852', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '48', '08,870', 'INFO', 'Getting dummies to cast categorical variables']\n", "['2020-07-29 09', '48', '08,885', 'INFO', 'Fitting TSNE()']\n", "['2020-07-29 09', '48', '09,534', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '48', '09,535', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=elbow, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '48', '09,535', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '09,536', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '48', '09,562', 'INFO', 'plot type', 'elbow']\n", "['2020-07-29 09', '48', '09,834', 'INFO', 'Fitting KElbowVisualizer()']\n", "['2020-07-29 09', '48', '11,999', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '48', '13,890', 'INFO', \"Saving 'Elbow.png' in current active directory\"]\n", "['2020-07-29 09', '48', '13,890', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '48', '13,891', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '13,931', 'INFO', 'SubProcess plot_model() end ==================================']\n", "['2020-07-29 09', '48', '13,932', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '48', '13,932', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '48', '13,934', 'INFO', \"save_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', 
max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '48', '13,934', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '48', '13,953', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '48', '13,975', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "[\"verbose=False), KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0)]']\n", "['2020-07-29 09', '48', '13,975', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '13,976', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '48', '14,077', 'INFO', \"KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", 
"[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0)']\n", "['2020-07-29 09', '48', '14,078', 'INFO', 'create_models() succesfully completed......................................']\n", "['2020-07-29 09', '48', '14,099', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '48', '14,100', 'INFO', 'create_model(model=kmodes, num_clusters=4, ground_truth=None, verbose=True, system=True)']\n", "['2020-07-29 09', '48', '14,100', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '14,101', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '48', '14,102', 'INFO', 'Setting num_cluster param']\n", "['2020-07-29 09', '48', '14,102', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '14,162', 'INFO', 'Importing untrained model']\n", "['2020-07-29 09', '48', '14,178', 'INFO', 'K-Modes Clustering Imported succesfully']\n", "['2020-07-29 09', '48', '14,201', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '48', '20,873', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '48', '20,911', 'INFO', 'Creating Metrics dataframe']\n", "['2020-07-29 09', '48', '20,919', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '48', '21,190', 'INFO', 'SubProcess plot_model() called ==================================']\n", "['2020-07-29 09', '48', '21,190', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '48', '21,192', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0), plot=cluster, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '48', '21,192', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '21,192', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '48', '21,221', 'INFO', 'plot type', 'cluster']\n", "['2020-07-29 09', '48', '21,221', 'INFO', 'SubProcess assign_model() called ==================================']\n", 
"['2020-07-29 09', '48', '21,221', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '48', '21,223', 'INFO', \"assign_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0), transformation=True, verbose=False)']\n", "['2020-07-29 09', '48', '21,223', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '21,223', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '48', '21,224', 'INFO', 'Copying data']\n", "['2020-07-29 09', '48', '21,224', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", "['2020-07-29 09', '48', '21,225', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '21,271', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '48', '21,273', 'INFO', 'Trained Model', 'K-Modes Clustering']\n", "['2020-07-29 09', '48', '21,274', 'INFO', '(224, 21)']\n", "['2020-07-29 09', '48', '21,274', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '21,275', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '48', '21,292', 'INFO', 'Fitting PCA()']\n", "['2020-07-29 09', '48', '21,315', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '48', '21,323', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '48', '21,784', 'INFO', \"Saving 'Cluster.html' in current active directory\"]\n", "['2020-07-29 09', '48', '21,784', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '48', '21,785', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '21,905', 'INFO', 'Removing stopwords']\n", "['2020-07-29 09', '48', '23,356', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '48', '23,357', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, 
random_state=123,']\n", "['verbose=0), plot=distribution, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '48', '23,357', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '23,357', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '48', '23,386', 'INFO', 'plot type', 'distribution']\n", "['2020-07-29 09', '48', '23,387', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '48', '23,387', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '48', '23,388', 'INFO', \"assign_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0), transformation=False, verbose=False)']\n", "['2020-07-29 09', '48', '23,388', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '23,388', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '48', '23,388', 'INFO', 'Copying data']\n", "['2020-07-29 09', '48', '23,391', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '23,427', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '48', '23,428', 'INFO', 'Trained Model', 'K-Modes Clustering']\n", "['2020-07-29 09', '48', '23,429', 'INFO', '(224, 22)']\n", "['2020-07-29 09', '48', '23,429', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '23,429', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '48', '23,430', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '48', '23,439', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '48', '24,069', 'INFO', \"Saving 'Distribution.html' in current active directory\"]\n", "['2020-07-29 09', '48', '24,069', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '48', '24,070', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '25,580', 'INFO', 
'Initializing plot_model()']\n", "['2020-07-29 09', '48', '25,582', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0), plot=elbow, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '48', '25,582', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '25,582', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '48', '25,604', 'INFO', 'plot type', 'elbow']\n", "['2020-07-29 09', '48', '25,658', 'INFO', 'Fitting KElbowVisualizer()']\n", "['2020-07-29 09', '48', '32,253', 'INFO', 'Extracting Bigrams']\n", "['2020-07-29 09', '48', '41,062', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '48', '41,646', 'INFO', \"Saving 'Elbow.png' in current active directory\"]\n", "['2020-07-29 09', '48', '41,646', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '48', '41,646', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '41,692', 'INFO', 'SubProcess plot_model() end ==================================']\n", "['2020-07-29 09', '48', '41,692', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '48', '41,693', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '48', '41,694', 'INFO', \"save_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '48', '41,694', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '48', '42,305', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '48', '42,330', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", 
"[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "[\"verbose=False), KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0)]']\n", "['2020-07-29 09', '48', '42,330', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '42,330', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '48', '42,451', 'INFO', \"KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0)']\n", "['2020-07-29 09', '48', '42,451', 'INFO', 'create_models() succesfully completed......................................']\n", "['2020-07-29 09', '48', '42,468', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '48', '42,469', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=False, verbose=True)']\n", "['2020-07-29 09', '48', '42,470', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '42,470', 'INFO', 
'Preloading libraries']\n", "['2020-07-29 09', '48', '42,470', 'INFO', 'Copying data']\n", "['2020-07-29 09', '48', '42,472', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '42,563', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '48', '42,573', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '48', '42,576', 'INFO', '(224, 22)']\n", "['2020-07-29 09', '48', '42,577', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '42,694', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '48', '42,695', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=None, label=False, save=False, system=True)']\n", "['2020-07-29 09', '48', '42,696', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '42,696', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '48', '42,737', 'INFO', 'plot type', 'cluster']\n", "['2020-07-29 09', '48', '42,737', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '48', '42,738', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '48', '42,739', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", "['2020-07-29 09', '48', '42,740', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '42,740', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '48', '42,740', 'INFO', 'Copying data']\n", "['2020-07-29 09', '48', '42,741', 'INFO', 'Transformation param set to True. 
Assigned clusters are attached on transformed dataset.']\n", "['2020-07-29 09', '48', '42,741', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '42,782', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '48', '42,788', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '48', '42,789', 'INFO', '(224, 21)']\n", "['2020-07-29 09', '48', '42,789', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '42,790', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '48', '42,805', 'INFO', 'Fitting PCA()']\n", "['2020-07-29 09', '48', '42,824', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '48', '42,833', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '48', '43,140', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '48', '43,140', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '43,154', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '48', '43,156', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=Country Name, label=True, save=False, system=True)']\n", "['2020-07-29 09', '48', '43,156', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '43,157', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '48', '43,186', 'INFO', 'plot type', 'cluster']\n", "['2020-07-29 09', '48', '43,188', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '48', '43,188', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '48', '43,192', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, 
n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", "['2020-07-29 09', '48', '43,192', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '43,193', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '48', '43,193', 'INFO', 'Copying data']\n", "['2020-07-29 09', '48', '43,194', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", "['2020-07-29 09', '48', '43,194', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '43,230', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '48', '43,232', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '48', '43,233', 'INFO', '(224, 21)']\n", "['2020-07-29 09', '48', '43,233', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '43,233', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '48', '43,246', 'INFO', 'Fitting PCA()']\n", "['2020-07-29 09', '48', '43,268', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '48', '43,274', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '48', '43,585', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '48', '43,585', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '43,599', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '48', '43,601', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=tsne, feature=None, label=False, save=False, system=True)']\n", "['2020-07-29 09', '48', '43,602', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '43,602', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '48', 
'43,658', 'INFO', 'plot type', 'tsne']\n", "['2020-07-29 09', '48', '43,659', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '48', '43,659', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '48', '43,661', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", "['2020-07-29 09', '48', '43,662', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '43,662', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '48', '43,663', 'INFO', 'Copying data']\n", "['2020-07-29 09', '48', '43,664', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", "['2020-07-29 09', '48', '43,664', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '48', '43,711', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '48', '43,713', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '48', '43,714', 'INFO', '(224, 21)']\n", "['2020-07-29 09', '48', '43,714', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '43,714', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '48', '43,718', 'INFO', 'Fitting TSNE()']\n", "['2020-07-29 09', '48', '49,461', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '48', '59,261', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '48', '59,268', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '48', '59,625', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '48', '59,626', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '48', '59,656', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '48', 
'59,658', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=elbow, feature=None, label=False, save=False, system=True)']\n", "['2020-07-29 09', '48', '59,658', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '48', '59,658', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '48', '59,688', 'INFO', 'plot type', 'elbow']\n", "['2020-07-29 09', '48', '59,688', 'INFO', 'Fitting KElbowVisualizer()']\n", "['2020-07-29 09', '49', '01,501', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '49', '01,501', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '01,532', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '49', '01,533', 'INFO', \"plot_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0), plot=umap, feature=None, save=False, system=True)']\n", "['2020-07-29 09', '49', '01,533', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '49', '01,533', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '49', '01,555', 'INFO', 'plot type', 'umap']\n", "['2020-07-29 09', '49', '01,556', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '49', '01,556', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '49', '01,556', 'INFO', \"assign_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0), transformation=True, score=False, verbose=False)']\n", "['2020-07-29 09', '49', '01,557', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '49', '01,557', 'INFO', 'Copying 
data']\n", "['2020-07-29 09', '49', '01,558', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '49', '01,588', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '49', '01,589', 'INFO', 'Trained Model', 'Assigned Isolation Forest']\n", "['2020-07-29 09', '49', '01,590', 'INFO', '(1000, 11)']\n", "['2020-07-29 09', '49', '01,590', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '01,590', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '49', '01,598', 'INFO', 'Getting dummies to cast categorical variables']\n", "['2020-07-29 09', '49', '02,407', 'INFO', 'Extracting Trigrams']\n", "['2020-07-29 09', '49', '05,305', 'INFO', 'Fitting UMAP()']\n", "['2020-07-29 09', '49', '14,048', 'INFO', 'PyCaret Regression Module']\n", "['2020-07-29 09', '49', '14,048', 'INFO', 'version pycaret-nightly-0.39']\n", "['2020-07-29 09', '49', '14,048', 'INFO', 'Initializing setup()']\n", "['2020-07-29 09', '49', '14,049', 'INFO', 'USI', 'd354']\n", "['2020-07-29 09', '49', '14,049', 'INFO', 'setup(data=(1338, 7), target=charges, train_size=0.7, sampling=True, sample_estimator=None, categorical_features=None, categorical_imputation=constant, ordinal_features=None,']\n", "['high_cardinality_features=None, high_cardinality_method=frequency, numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']\n", "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None, remove_outliers=False, outliers_threshold=0.05,']\n", "['remove_multicollinearity=False, multicollinearity_threshold=0.9, remove_perfect_collinearity=False, create_clusters=False, 
cluster_iter=20,']\n", "['polynomial_features=False, polynomial_degree=2, trigonometry_features=False, polynomial_threshold=0.1, group_features=None,']\n", "['group_names=None, feature_selection=False, feature_selection_threshold=0.8, feature_interaction=False, feature_ratio=False, interaction_threshold=0.01, transform_target=False,']\n", "['transform_target_method=box-cox, data_split_shuffle=True, folds_shuffle=False, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", "['experiment_name=insurance1, log_plots=False, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", "['2020-07-29 09', '49', '14,049', 'INFO', 'Checking environment']\n", "['2020-07-29 09', '49', '14,049', 'INFO', 'python_version', '3.6.10']\n", "['2020-07-29 09', '49', '14,050', 'INFO', 'python_build', \"('default', 'May 7 2020 19\", '46', \"08')\"]\n", "['2020-07-29 09', '49', '14,050', 'INFO', 'machine', 'AMD64']\n", "['2020-07-29 09', '49', '14,050', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", "['2020-07-29 09', '49', '14,097', 'INFO', 'Memory', 'svmem(total=17032478720, available=5629382656, percent=66.9, used=11403096064, free=5629382656)']\n", "['2020-07-29 09', '49', '14,097', 'INFO', 'Physical Core', '4']\n", "['2020-07-29 09', '49', '14,097', 'INFO', 'Logical Core', '8']\n", "['2020-07-29 09', '49', '14,097', 'INFO', 'Checking libraries']\n", "['2020-07-29 09', '49', '14,097', 'INFO', 'pd==1.0.4']\n", "['2020-07-29 09', '49', '14,098', 'INFO', 'numpy==1.18.5']\n", "['2020-07-29 09', '49', '14,935', 'INFO', 'sklearn==0.23.1']\n", "['2020-07-29 09', '49', '15,080', 'INFO', 'xgboost==1.1.1']\n", "['2020-07-29 09', '49', '15,220', 'INFO', 'lightgbm==2.3.1']\n", "['2020-07-29 09', '49', '15,339', 'INFO', 'catboost==0.23.2']\n", "['2020-07-29 09', '49', '16,374', 'INFO', 'mlflow==1.8.0']\n", "['2020-07-29 09', '49', '16,375', 'INFO', 'Checking Exceptions']\n", "['2020-07-29 09', '49', '16,375', 'INFO', 'Preloading libraries']\n", 
"['2020-07-29 09', '49', '16,375', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '49', '16,408', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '49', '19,757', 'INFO', 'Copying data for preprocessing']\n", "['2020-07-29 09', '49', '19,758', 'INFO', 'Declaring global variables']\n", "['2020-07-29 09', '49', '19,777', 'INFO', 'Declaring preprocessing parameters']\n", "['2020-07-29 09', '49', '19,777', 'INFO', 'Importing preprocessing module']\n", "['2020-07-29 09', '49', '21,005', 'INFO', 'Creating preprocessing pipeline']\n", "['2020-07-29 09', '49', '22,813', 'INFO', 'Preprocessing pipeline created successfully']\n", "['2020-07-29 09', '49', '22,813', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '22,814', 'INFO', 'Creating grid variables']\n", "['2020-07-29 09', '49', '22,818', 'INFO', 'Creating global containers']\n", "['2020-07-29 09', '49', '22,997', 'INFO', 'Logging experiment in MLFlow']\n", "['2020-07-29 09', '49', '23,497', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '23,497', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '23,514', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', 
Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", "['2020-07-29 09', '49', '23,514', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '23,528', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '23,556', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), 
('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), None]']\n", "['2020-07-29 09', '49', '23,557', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '23,557', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '24,045', 'INFO', 'create_model_container', '0']\n", "['2020-07-29 09', '49', '24,045', 'INFO', 'master_model_container', '0']\n", "['2020-07-29 09', '49', '24,045', 'INFO', 'display_container', '0']\n", "['2020-07-29 09', '49', '24,045', 'INFO', 'setup() succesfully completed......................................']\n", "['2020-07-29 09', '49', '25,845', 'INFO', 'Initializing compare_models()']\n", "['2020-07-29 09', '49', '25,845', 'INFO', 'compare_models(blacklist=None, whitelist=None, fold=5, round=4, sort=R2, n_select=1, turbo=True, verbose=True)']\n", "['2020-07-29 09', '49', '25,845', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '49', '25,846', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '49', '25,846', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '49', '25,953', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '49', '25,957', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '49', '25,997', 'INFO', 'Importing untrained models']\n", "['2020-07-29 09', '49', '26,001', 'INFO', 'Import successful']\n", "['2020-07-29 09', '49', '26,023', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '49', '26,023', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '49', '26,023', 'INFO', 'Initializing Linear Regression']\n", 
"['2020-07-29 09', '49', '26,050', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '26,072', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '26,081', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '26,097', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '26,098', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '26,243', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '26,280', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '26,291', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '26,298', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '26,298', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '26,372', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '26,407', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '26,424', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '26,430', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '26,430', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '26,489', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '26,529', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '26,542', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '26,547', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '26,547', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '26,627', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '26,685', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '26,695', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '26,701', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '26,702', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '26,784', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '26,787', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '26,947', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', 
'27,492', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '27,492', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '27,496', 'INFO', 'save_model(model=LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '49', '27,496', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '27,584', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '27,637', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), None]']\n", "['2020-07-29 09', '49', '27,638', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '27,638', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '27,641', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '49', '27,775', 'INFO', 'Initializing 
Lasso Regression']\n", "['2020-07-29 09', '49', '27,790', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '27,809', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '27,819', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '27,824', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '27,824', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '27,842', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '27,862', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '27,871', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '27,876', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '27,876', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '27,899', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '27,909', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '49', '27,910', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '27,921', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '27,931', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '27,939', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '27,939', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '27,968', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '27,993', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '28,006', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '28,013', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '28,014', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '28,044', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '28,072', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '28,083', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '28,091', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '28,091', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', 
'28,118', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '28,119', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '28,162', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '28,366', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '28,367', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '28,367', 'INFO', 'save_model(model=Lasso(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=1000,']\n", "['normalize=False, positive=False, precompute=False, random_state=123,']\n", "[\"selection='cyclic', tol=0.0001, warm_start=False), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '49', '28,368', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '28,392', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '28,410', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), Lasso(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=1000,']\n", "['normalize=False, 
positive=False, precompute=False, random_state=123,']\n", "[\"selection='cyclic', tol=0.0001, warm_start=False), None]\"]\n", "['2020-07-29 09', '49', '28,410', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '28,410', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '28,583', 'INFO', 'Initializing Ridge Regression']\n", "['2020-07-29 09', '49', '28,598', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '28,599', 'INFO', \"save_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0), model_name=iforest, verbose=True)']\n", "['2020-07-29 09', '49', '28,600', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '28,607', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '28,630', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '28,638', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '28,645', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '28,645', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '28,663', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '28,682', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '28,692', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '28,697', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '28,697', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '28,720', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '28,744', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '28,752', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '28,758', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '28,759', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '28,766', 'INFO', 'iforest.pkl saved in current 
working directory']\n", "['2020-07-29 09', '49', '28,782', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '28,787', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_L...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "[\"verbose=False), IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0)]']\n", "['2020-07-29 09', '49', '28,788', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '28,808', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '28,818', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '28,826', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '28,826', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '28,853', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '28,878', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '28,886', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '28,893', 'INFO', 'No inverse transformer found']\n", 
"['2020-07-29 09', '49', '28,893', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '28,917', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '28,918', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '28,963', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '29,109', 'INFO', 'Initializing deploy_model()']\n", "['2020-07-29 09', '49', '29,111', 'INFO', \"deploy_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "[\"random_state=123, verbose=0), model_name=iforest-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", "['2020-07-29 09', '49', '29,111', 'INFO', 'Platform', 'AWS S3']\n", "['2020-07-29 09', '49', '29,245', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '29,245', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '29,246', 'INFO', 'save_model(model=Ridge(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=None,']\n", "[\"normalize=False, random_state=123, solver='auto', tol=0.001), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '49', '29,247', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '29,272', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '29,288', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', 
Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), Ridge(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=None,']\n", "[\"normalize=False, random_state=123, solver='auto', tol=0.001), None]\"]\n", "['2020-07-29 09', '49', '29,289', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '29,289', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '29,429', 'INFO', 'Saving model in current working directory']\n", "['2020-07-29 09', '49', '29,430', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '29,430', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '29,430', 'INFO', \"save_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0), model_name=iforest-aws, verbose=False)']\n", "['2020-07-29 09', '49', '29,431', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '29,481', 'INFO', 'Initializing Elastic Net']\n", "['2020-07-29 09', '49', '29,503', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '29,528', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '29,540', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '29,545', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '29,546', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '29,573', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '29,595', 'INFO', 'Fitting 
Model']\n", "['2020-07-29 09', '49', '29,606', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '29,614', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '29,615', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '29,654', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '29,677', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '29,689', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '29,697', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '29,697', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '29,698', 'INFO', 'iforest-aws.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '29,722', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_L...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "[\"verbose=False), IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0)]']\n", "['2020-07-29 09', '49', '29,722', 'INFO', 'save_model() succesfully 
completed......................................']\n", "['2020-07-29 09', '49', '29,723', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '29,723', 'INFO', 'Initializing S3 client']\n", "['2020-07-29 09', '49', '29,729', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '29,755', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '29,767', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '29,776', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '29,776', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '29,804', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '29,831', 'INFO', 'Fitting Model']\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "['2020-07-29 09', '49', '29,843', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '29,850', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '29,850', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '29,888', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '29,891', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '29,955', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '30,209', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '30,210', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '30,211', 'INFO', 'save_model(model=ElasticNet(alpha=1.0, copy_X=True, fit_intercept=True, l1_ratio=0.5,']\n", "['max_iter=1000, normalize=False, positive=False, precompute=False,']\n", "[\"random_state=123, selection='cyclic', tol=0.0001, warm_start=False), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '49', '30,211', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '30,234', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '30,256', 'INFO', '[Pipeline(memory=None,']\n", 
"[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), ElasticNet(alpha=1.0, copy_X=True, fit_intercept=True, l1_ratio=0.5,']\n", "['max_iter=1000, normalize=False, positive=False, precompute=False,']\n", "[\"random_state=123, selection='cyclic', tol=0.0001, warm_start=False), None]\"]\n", "['2020-07-29 09', '49', '30,256', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '30,257', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '30,444', 'INFO', 'Initializing Least Angle Regression']\n", "['2020-07-29 09', '49', '30,464', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '30,487', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '30,514', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '30,521', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '30,521', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '30,546', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '30,571', 'INFO', 'Fitting Model']\n", "['2020-07-29 
09', '49', '30,595', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '30,600', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '30,600', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '30,630', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '30,652', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '30,670', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '30,677', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '30,678', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '30,704', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '30,731', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '30,752', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '30,759', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '30,759', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '30,783', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '30,813', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '30,830', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '30,838', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '30,839', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '30,858', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '30,859', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '30,898', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '31,084', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '31,084', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '31,085', 'INFO', 'save_model(model=Lars(copy_X=True, eps=2.220446049250313e-16, fit_intercept=True, fit_path=True,']\n", "[\"jitter=None, n_nonzero_coefs=500, normalize=True, precompute='auto',\"]\n", "['random_state=None, verbose=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', 
'49', '31,085', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '31,100', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '31,113', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), Lars(copy_X=True, eps=2.220446049250313e-16, fit_intercept=True, fit_path=True,']\n", "[\"jitter=None, n_nonzero_coefs=500, normalize=True, precompute='auto',\"]\n", "['random_state=None, verbose=False), None]']\n", "['2020-07-29 09', '49', '31,114', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '31,114', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '31,259', 'INFO', 'Initializing Lasso Least Angle Regression']\n", "['2020-07-29 09', '49', '31,273', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '31,290', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '31,303', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '31,307', 'INFO', 'No inverse transformer found']\n", 
"['2020-07-29 09', '49', '31,307', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '31,322', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '31,337', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '31,349', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '31,353', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '31,354', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '31,371', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '31,385', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '31,397', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '31,401', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '31,401', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '31,418', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '31,435', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '31,447', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '31,454', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '31,454', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '31,476', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '31,493', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '31,505', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '31,510', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '31,510', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '31,533', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '31,535', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '31,571', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '31,659', 'INFO', \"IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", "['random_state=123, verbose=0)']\n", "['2020-07-29 09', '49', '31,660', 'INFO', 'deploy_model() succesfully 
completed......................................']\n", "['2020-07-29 09', '49', '31,676', 'INFO', 'Initializing get_config()']\n", "['2020-07-29 09', '49', '31,677', 'INFO', 'get_config(variable=X)']\n", "['2020-07-29 09', '49', '31,677', 'INFO', 'Global variable', 'X returned']\n", "['2020-07-29 09', '49', '31,678', 'INFO', 'get_config() succesfully completed......................................']\n", "['2020-07-29 09', '49', '31,728', 'INFO', 'Initializing get_config()']\n", "['2020-07-29 09', '49', '31,729', 'INFO', 'get_config(variable=seed)']\n", "['2020-07-29 09', '49', '31,729', 'INFO', 'Global variable', 'seed returned']\n", "['2020-07-29 09', '49', '31,729', 'INFO', 'get_config() succesfully completed......................................']\n", "['2020-07-29 09', '49', '31,747', 'INFO', 'Initializing set_config()']\n", "['2020-07-29 09', '49', '31,748', 'INFO', 'set_config(variable=seed, value=999)']\n", "['2020-07-29 09', '49', '31,748', 'INFO', 'Global variable', 'seed updated']\n", "['2020-07-29 09', '49', '31,748', 'INFO', 'set_config() succesfully completed......................................']\n", "['2020-07-29 09', '49', '31,762', 'INFO', 'Initializing get_config()']\n", "['2020-07-29 09', '49', '31,763', 'INFO', 'get_config(variable=seed)']\n", "['2020-07-29 09', '49', '31,764', 'INFO', 'Global variable', 'seed returned']\n", "['2020-07-29 09', '49', '31,764', 'INFO', 'get_config() succesfully completed......................................']\n", "['2020-07-29 09', '49', '31,768', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '31,768', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '31,770', 'INFO', 'save_model(model=LassoLars(alpha=1.0, copy_X=True, eps=2.220446049250313e-16, fit_intercept=True,']\n", "['fit_path=True, jitter=None, max_iter=500, normalize=True,']\n", "[\"positive=False, precompute='auto', random_state=None, verbose=False), model_name=Trained Model, 
verbose=False)\"]\n", "['2020-07-29 09', '49', '31,770', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '31,804', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '31,838', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), LassoLars(alpha=1.0, copy_X=True, eps=2.220446049250313e-16, fit_intercept=True,']\n", "['fit_path=True, jitter=None, max_iter=500, normalize=True,']\n", "[\"positive=False, precompute='auto', random_state=None, verbose=False), None]\"]\n", "['2020-07-29 09', '49', '31,838', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '31,839', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '32,048', 'INFO', 'Initializing Orthogonal Matching Pursuit']\n", "['2020-07-29 09', '49', '32,071', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '32,100', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '32,114', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 
09', '49', '32,120', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '32,121', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '32,149', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '32,171', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '32,182', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '32,189', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '32,190', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '32,214', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '32,239', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '32,251', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '32,259', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '32,259', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '32,293', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '32,320', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '32,332', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '32,339', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '32,340', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '32,364', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '32,391', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '32,401', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '32,410', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '32,410', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '32,438', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '32,439', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '32,496', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '32,721', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '32,721', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '32,722', 'INFO', 
'save_model(model=OrthogonalMatchingPursuit(fit_intercept=True, n_nonzero_coefs=None,']\n", "[\"normalize=True, precompute='auto', tol=None), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '49', '32,723', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '32,747', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '32,777', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), OrthogonalMatchingPursuit(fit_intercept=True, n_nonzero_coefs=None,']\n", "[\"normalize=True, precompute='auto', tol=None), None]\"]\n", "['2020-07-29 09', '49', '32,778', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '32,778', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '33,009', 'INFO', 'Initializing Bayesian Ridge']\n", "['2020-07-29 09', '49', '33,039', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '33,069', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', 
'33,090', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '33,097', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '33,097', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '33,123', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '33,148', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '33,166', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '33,174', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '33,174', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '33,201', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '33,231', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '33,253', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '33,263', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '33,264', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '33,299', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '33,329', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '33,346', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '33,355', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '33,356', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '33,388', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '33,414', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '33,433', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '33,441', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '33,441', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '33,467', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '33,469', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '33,543', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '33,846', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '33,846', 'INFO', 'Initializing 
save_model()']\n", "['2020-07-29 09', '49', '33,848', 'INFO', 'save_model(model=BayesianRidge(alpha_1=1e-06, alpha_2=1e-06, alpha_init=None,']\n", "['compute_score=False, copy_X=True, fit_intercept=True,']\n", "['lambda_1=1e-06, lambda_2=1e-06, lambda_init=None, n_iter=300,']\n", "['normalize=False, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '49', '33,848', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '33,884', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '33,914', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), BayesianRidge(alpha_1=1e-06, alpha_2=1e-06, alpha_init=None,']\n", "['compute_score=False, copy_X=True, fit_intercept=True,']\n", "['lambda_1=1e-06, lambda_2=1e-06, lambda_init=None, n_iter=300,']\n", "['normalize=False, tol=0.001, verbose=False), None]']\n", "['2020-07-29 09', '49', '33,914', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '33,914', 'INFO', 
'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '34,122', 'INFO', 'Initializing Passive Aggressive Regressor']\n", "['2020-07-29 09', '49', '34,147', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '34,176', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '34,202', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '34,208', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '34,208', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '34,230', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '34,248', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '34,269', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '34,274', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '34,275', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '34,299', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '34,327', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '34,354', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '34,362', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '34,363', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '34,396', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '34,425', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '34,454', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '34,458', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '34,459', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '34,488', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '34,517', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '34,543', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '34,551', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '34,552', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '34,582', 'INFO', 'Calculating mean and std']\n", 
"['2020-07-29 09', '49', '34,584', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '34,638', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '34,855', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '34,855', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '34,857', 'INFO', 'save_model(model=PassiveAggressiveRegressor(C=1.0, average=False, early_stopping=False,']\n", "['epsilon=0.1, fit_intercept=True,']\n", "[\"loss='epsilon_insensitive', max_iter=1000,\"]\n", "['n_iter_no_change=5, random_state=123, shuffle=True,']\n", "['tol=0.001, validation_fraction=0.1, verbose=0,']\n", "['warm_start=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '49', '34,857', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '34,884', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '34,912', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), PassiveAggressiveRegressor(C=1.0, 
average=False, early_stopping=False,']\n", "['epsilon=0.1, fit_intercept=True,']\n", "[\"loss='epsilon_insensitive', max_iter=1000,\"]\n", "['n_iter_no_change=5, random_state=123, shuffle=True,']\n", "['tol=0.001, validation_fraction=0.1, verbose=0,']\n", "['warm_start=False), None]']\n", "['2020-07-29 09', '49', '34,912', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '34,912', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '35,070', 'INFO', 'Initializing Random Sample Consensus']\n", "['2020-07-29 09', '49', '35,086', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '35,110', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '35,317', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '35,323', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '35,324', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '35,341', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '35,357', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '35,576', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '35,580', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '35,581', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '35,600', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '35,617', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '35,900', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '35,907', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '35,908', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '35,938', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '35,965', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '36,277', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '36,283', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '36,283', 'INFO', 'Compiling 
Metrics']\n", "['2020-07-29 09', '49', '36,307', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '36,328', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '36,615', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '36,620', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '36,620', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '36,638', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '36,639', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '36,682', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '36,866', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '36,866', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '36,867', 'INFO', 'save_model(model=RANSACRegressor(base_estimator=None, is_data_valid=None, is_model_valid=None,']\n", "[\"loss='absolute_loss', max_skips=inf, max_trials=100,\"]\n", "['min_samples=0.5, random_state=123, residual_threshold=None,']\n", "['stop_n_inliers=inf, stop_probability=0.99, stop_score=inf), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '49', '36,867', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '36,881', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '36,893', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), 
('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), RANSACRegressor(base_estimator=None, is_data_valid=None, is_model_valid=None,']\n", "[\"loss='absolute_loss', max_skips=inf, max_trials=100,\"]\n", "['min_samples=0.5, random_state=123, residual_threshold=None,']\n", "['stop_n_inliers=inf, stop_probability=0.99, stop_score=inf), None]']\n", "['2020-07-29 09', '49', '36,893', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '36,894', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '37,043', 'INFO', 'Initializing TheilSen Regressor']\n", "['2020-07-29 09', '49', '37,062', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '37,081', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '45,284', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '45,289', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '45,289', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '45,308', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '45,327', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '47,087', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '47,092', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '47,093', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '47,110', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '47,130', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '48,914', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '48,918', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '48,919', 
'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '48,938', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '48,960', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '50,969', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '50,974', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '50,974', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '50,997', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '51,022', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '52,626', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '52,633', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '52,633', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '52,651', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '52,651', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '52,706', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '53,189', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '53,190', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '53,191', 'INFO', 'save_model(model=TheilSenRegressor(copy_X=True, fit_intercept=True, max_iter=300,']\n", "['max_subpopulation=10000, n_jobs=-1, n_subsamples=None,']\n", "['random_state=123, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '49', '53,191', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '53,205', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '53,219', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", 
"[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), TheilSenRegressor(copy_X=True, fit_intercept=True, max_iter=300,']\n", "['max_subpopulation=10000, n_jobs=-1, n_subsamples=None,']\n", "['random_state=123, tol=0.001, verbose=False), None]']\n", "['2020-07-29 09', '49', '53,220', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '53,220', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '53,380', 'INFO', 'Initializing Huber Regressor']\n", "['2020-07-29 09', '49', '53,393', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '53,418', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '53,583', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '53,587', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '53,587', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '53,608', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '53,627', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '53,750', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '53,755', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '53,755', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '53,775', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '53,797', 'INFO', 
'Fitting Model']\n", "['2020-07-29 09', '49', '53,937', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '53,943', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '53,944', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '53,964', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '53,987', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '54,134', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '54,141', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '54,141', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '54,160', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '54,180', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '54,320', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '54,325', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '54,326', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '54,347', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '54,348', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '54,389', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '54,547', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '54,547', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '54,547', 'INFO', 'save_model(model=HuberRegressor(alpha=0.0001, epsilon=1.35, fit_intercept=True, max_iter=100,']\n", "['tol=1e-05, warm_start=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '49', '54,548', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '54,560', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '54,572', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", 
"[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), HuberRegressor(alpha=0.0001, epsilon=1.35, fit_intercept=True, max_iter=100,']\n", "['tol=1e-05, warm_start=False), None]']\n", "['2020-07-29 09', '49', '54,573', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '54,573', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '54,742', 'INFO', 'Initializing Support Vector Machine']\n", "['2020-07-29 09', '49', '54,758', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '54,775', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '54,906', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '54,927', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '54,928', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '54,956', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '54,983', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '55,088', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '55,109', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '55,109', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '55,136', 'INFO', 'Initializing Fold 3']\n", 
"['2020-07-29 09', '49', '55,173', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '55,286', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '55,308', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '55,309', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '55,353', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '55,376', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '55,499', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '55,525', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '55,525', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '55,579', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '55,643', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '55,789', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '55,814', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '55,815', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '55,874', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '55,877', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '55,972', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '56,261', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '56,261', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '56,263', 'INFO', \"save_model(model=SVR(C=1.0, cache_size=200, coef0=0.0, degree=3, epsilon=0.1, gamma='scale',\"]\n", "[\"kernel='rbf', max_iter=-1, shrinking=True, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '49', '56,263', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '56,290', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '56,309', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", 
"['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), SVR(C=1.0, cache_size=200, coef0=0.0, degree=3, epsilon=0.1, gamma='scale',\"]\n", "[\"kernel='rbf', max_iter=-1, shrinking=True, tol=0.001, verbose=False), None]\"]\n", "['2020-07-29 09', '49', '56,309', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '56,310', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '56,443', 'INFO', 'Initializing K Neighbors Regressor']\n", "['2020-07-29 09', '49', '56,461', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '56,479', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '56,490', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '56,608', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '56,608', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '56,633', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '56,648', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '56,658', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '56,771', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 
09', '49', '56,772', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '56,792', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '56,812', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '56,829', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '56,946', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '56,946', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '56,965', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '56,984', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '56,995', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '57,106', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '57,107', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '57,121', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '57,136', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '57,143', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '57,254', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '57,254', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '57,273', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '57,273', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '57,305', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '57,442', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '57,442', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '57,443', 'INFO', \"save_model(model=KNeighborsRegressor(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", "[\"weights='uniform'), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '49', '57,443', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '57,456', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', 
'57,468', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), KNeighborsRegressor(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", "[\"weights='uniform'), None]\"]\n", "['2020-07-29 09', '49', '57,469', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '57,469', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '57,561', 'INFO', 'Initializing Decision Tree']\n", "['2020-07-29 09', '49', '57,572', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '57,586', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '57,595', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '57,599', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '57,599', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '57,611', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '57,626', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '57,641', 
'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '57,646', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '57,647', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '57,671', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '57,697', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '57,714', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '57,720', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '57,721', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '57,747', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '49', '57,776', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '57,794', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '57,802', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '57,802', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '57,827', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '49', '57,844', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '57,856', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '57,861', 'INFO', 'No inverse transformer found']\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "['2020-07-29 09', '49', '57,861', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '57,880', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '49', '57,882', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '49', '57,920', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '49', '58,087', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '49', '58,088', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '49', '58,089', 'INFO', \"save_model(model=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", "['max_features=None, max_leaf_nodes=None,']\n", "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", "['min_samples_leaf=1, 
min_samples_split=2,']\n", "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", "['2020-07-29 09', '49', '58,090', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '49', '58,105', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '49', '58,125', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", "['max_features=None, max_leaf_nodes=None,']\n", "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", "['min_samples_leaf=1, min_samples_split=2,']\n", "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", "[\"random_state=123, splitter='best'), None]\"]\n", "['2020-07-29 09', '49', '58,126', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '49', '58,126', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '49', '58,253', 
'INFO', 'Initializing Random Forest']\n", "['2020-07-29 09', '49', '58,267', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '49', '58,286', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '58,838', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '58,950', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '58,951', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '58,967', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '49', '58,988', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '49', '59,551', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '49', '59,666', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '49', '59,667', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '49', '59,693', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '49', '59,726', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '00,434', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '00,551', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '00,552', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '00,569', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '50', '00,585', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '01,120', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '01,231', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '01,232', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '01,249', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '50', '01,269', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '01,827', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '01,937', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '01,937', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '01,951', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '50', '01,952', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '50', '01,989', 'INFO', 'Creating 
MLFlow logs']\n", "['2020-07-29 09', '50', '02,150', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '50', '02,150', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '50', '02,151', 'INFO', \"save_model(model=RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", "['max_samples=None, min_impurity_decrease=0.0,']\n", "['min_impurity_split=None, min_samples_leaf=1,']\n", "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '50', '02,151', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '50', '02,248', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '50', '02,262', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, 
criterion='mse',\"]\n", "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", "['max_samples=None, min_impurity_decrease=0.0,']\n", "['min_impurity_split=None, min_samples_leaf=1,']\n", "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", "['random_state=123, verbose=0, warm_start=False), None]']\n", "['2020-07-29 09', '50', '02,263', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '02,263', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '50', '02,392', 'INFO', 'Initializing Extra Trees Regressor']\n", "['2020-07-29 09', '50', '02,406', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '50', '02,420', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '02,827', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '02,938', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '02,938', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '02,953', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '50', '02,969', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '03,270', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '03,380', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '03,380', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '03,395', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '50', '03,411', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '03,707', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '03,821', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '03,821', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '03,841', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '50', '03,855', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '04,177', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '04,286', 'INFO', 'No 
inverse transformer found']\n", "['2020-07-29 09', '50', '04,286', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '04,302', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '50', '04,315', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '04,609', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '04,719', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '04,719', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '04,731', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '50', '04,732', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '50', '04,773', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '50', '04,942', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '50', '04,942', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '50', '04,943', 'INFO', \"save_model(model=ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", "['max_samples=None, min_impurity_decrease=0.0,']\n", "['min_impurity_split=None, min_samples_leaf=1,']\n", "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '50', '04,943', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '50', '05,031', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '50', '05,043', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", 
"[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", "['max_samples=None, min_impurity_decrease=0.0,']\n", "['min_impurity_split=None, min_samples_leaf=1,']\n", "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", "['random_state=123, verbose=0, warm_start=False), None]']\n", "['2020-07-29 09', '50', '05,043', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '05,043', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '50', '05,162', 'INFO', 'Initializing AdaBoost Regressor']\n", "['2020-07-29 09', '50', '05,174', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '50', '05,191', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '05,255', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '05,260', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '05,260', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '05,273', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '50', '05,288', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '05,331', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '05,337', 'INFO', 'No inverse transformer found']\n", 
"['2020-07-29 09', '50', '05,337', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '05,349', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '50', '05,363', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '05,396', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '05,402', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '05,402', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '05,416', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '50', '05,434', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '05,466', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '05,471', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '05,472', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '05,486', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '50', '05,500', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '05,548', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '05,555', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '05,555', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '05,569', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '50', '05,570', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '50', '05,608', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '50', '05,786', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '50', '05,786', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '50', '05,786', 'INFO', \"save_model(model=AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '50', '05,786', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '50', '05,802', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '50', '05,813', 'INFO', 
'[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", "['n_estimators=50, random_state=123), None]']\n", "['2020-07-29 09', '50', '05,813', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '05,814', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '50', '05,897', 'INFO', 'Initializing Gradient Boosting Regressor']\n", "['2020-07-29 09', '50', '05,908', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '50', '05,922', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '06,084', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '06,089', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '06,089', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '06,101', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '50', '06,113', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '06,270', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 
09', '50', '06,273', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '06,273', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '06,285', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '50', '06,299', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '06,448', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '06,452', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '06,452', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '06,464', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '50', '06,479', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '06,630', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '06,634', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '06,634', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '06,645', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '50', '06,659', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '06,809', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '06,813', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '06,813', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '06,824', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '50', '06,825', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '50', '06,856', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '50', '07,002', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '50', '07,002', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '50', '07,003', 'INFO', \"save_model(model=GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", "['max_features=None, max_leaf_nodes=None,']\n", "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", "['min_samples_leaf=1, min_samples_split=2,']\n", 
"['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", "[\"n_iter_no_change=None, presort='deprecated',\"]\n", "['random_state=123, subsample=1.0, tol=0.0001,']\n", "['validation_fraction=0.1, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '50', '07,003', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '50', '07,018', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '50', '07,028', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", "['max_features=None, max_leaf_nodes=None,']\n", "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", "['min_samples_leaf=1, min_samples_split=2,']\n", "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", "[\"n_iter_no_change=None, presort='deprecated',\"]\n", "['random_state=123, subsample=1.0, tol=0.0001,']\n", "['validation_fraction=0.1, verbose=0, 
warm_start=False), None]']\n", "['2020-07-29 09', '50', '07,029', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '07,029', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '50', '07,161', 'INFO', 'Initializing Extreme Gradient Boosting']\n", "['2020-07-29 09', '50', '07,173', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '50', '07,190', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '07,362', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '07,368', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '07,369', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '07,394', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '50', '07,416', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '07,586', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '07,592', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '07,592', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '07,620', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '50', '07,643', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '07,828', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '07,834', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '07,834', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '07,863', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '50', '07,887', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '08,074', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '08,081', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '08,081', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '08,110', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '50', '08,135', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '08,339', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '08,346', 
'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '08,346', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '08,375', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '50', '08,376', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '50', '08,448', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '50', '08,679', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '50', '08,680', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '50', '08,686', 'INFO', \"save_model(model=XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", "['colsample_bynode=1, colsample_bytree=1, gamma=0, gpu_id=-1,']\n", "[\"importance_type='gain', interaction_constraints='',\"]\n", "['learning_rate=0.300000012, max_delta_step=0, max_depth=6,']\n", "[\"min_child_weight=1, missing=nan, monotone_constraints='()',\"]\n", "['n_estimators=100, n_jobs=-1, num_parallel_tree=1,']\n", "[\"objective='reg\", \"squarederror', random_state=123, reg_alpha=0,\"]\n", "[\"reg_lambda=1, scale_pos_weight=1, subsample=1, tree_method='exact',\"]\n", "['validate_parameters=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '50', '08,686', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '50', '08,711', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '50', '08,730', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', 
Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", "['colsample_bynode=1, colsample_bytree=1, gamma=0, gpu_id=-1,']\n", "[\"importance_type='gain', interaction_constraints='',\"]\n", "['learning_rate=0.300000012, max_delta_step=0, max_depth=6,']\n", "[\"min_child_weight=1, missing=nan, monotone_constraints='()',\"]\n", "['n_estimators=100, n_jobs=-1, num_parallel_tree=1,']\n", "[\"objective='reg\", \"squarederror', random_state=123, reg_alpha=0,\"]\n", "[\"reg_lambda=1, scale_pos_weight=1, subsample=1, tree_method='exact',\"]\n", "['validate_parameters=1, verbosity=0), None]']\n", "['2020-07-29 09', '50', '08,730', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '08,730', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '50', '08,868', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", "['2020-07-29 09', '50', '08,881', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '50', '08,901', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '09,213', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '09,226', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '09,226', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '09,258', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '50', '09,282', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '09,525', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '09,535', 'INFO', 'No inverse 
transformer found']\n", "['2020-07-29 09', '50', '09,535', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '09,567', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '50', '09,592', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '09,871', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '09,882', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '09,882', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '09,913', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '50', '09,938', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '10,228', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '10,241', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '10,241', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '10,271', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '50', '10,299', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '10,568', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '10,579', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '10,579', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '10,610', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '50', '10,612', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '50', '10,683', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '50', '10,933', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '50', '10,933', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '50', '10,936', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", 
"['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '50', '10,936', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '50', '10,982', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '50', '11,014', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", "['2020-07-29 09', '50', '11,015', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '11,015', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 
09', '50', '11,186', 'INFO', 'Initializing CatBoost Regressor']\n", "['2020-07-29 09', '50', '11,198', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '50', '11,213', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '15,134', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '15,140', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '15,140', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '15,156', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '50', '15,174', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '19,173', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '19,181', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '19,181', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '19,199', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '50', '19,214', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '20,317', 'INFO', 'PyCaret Clustering Module']\n", "['2020-07-29 09', '50', '20,317', 'INFO', 'version pycaret-nightly-0.39']\n", "['2020-07-29 09', '50', '20,317', 'INFO', 'Initializing setup()']\n", "['2020-07-29 09', '50', '20,317', 'INFO', 'USI', 'a262']\n", "['2020-07-29 09', '50', '20,318', 'INFO', 'setup(data=(224, 21), categorical_features=None, categorical_imputation=constant, ordinal_features=None, high_cardinality_features=None,']\n", "[\"numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=['Country Name'], normalize=False,\"]\n", "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None,']\n", "['remove_multicollinearity=False, multicollinearity_threshold=0.9, group_features=None,']\n", "['group_names=None, supervised=False, supervised_target=None, 
n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", "['experiment_name=health1, log_plots=True, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", "['2020-07-29 09', '50', '20,318', 'INFO', 'Checking environment']\n", "['2020-07-29 09', '50', '20,318', 'INFO', 'python_version', '3.6.10']\n", "['2020-07-29 09', '50', '20,318', 'INFO', 'python_build', \"('default', 'May 7 2020 19\", '46', \"08')\"]\n", "['2020-07-29 09', '50', '20,318', 'INFO', 'machine', 'AMD64']\n", "['2020-07-29 09', '50', '20,319', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", "['2020-07-29 09', '50', '20,400', 'INFO', 'Memory', 'svmem(total=17032478720, available=4871823360, percent=71.4, used=12160655360, free=4871823360)']\n", "['2020-07-29 09', '50', '20,402', 'INFO', 'Physical Core', '4']\n", "['2020-07-29 09', '50', '20,402', 'INFO', 'Logical Core', '8']\n", "['2020-07-29 09', '50', '20,402', 'INFO', 'Checking libraries']\n", "['2020-07-29 09', '50', '20,402', 'INFO', 'pd==1.0.4']\n", "['2020-07-29 09', '50', '20,402', 'INFO', 'numpy==1.18.5']\n", "['2020-07-29 09', '50', '22,550', 'INFO', 'sklearn==0.23.1']\n", "['2020-07-29 09', '50', '22,554', 'INFO', 'kmodes==0.10.2']\n", "['2020-07-29 09', '50', '23,217', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '23,224', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '23,224', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '23,238', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '50', '23,257', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '25,615', 'INFO', 'mlflow==1.8.0']\n", "['2020-07-29 09', '50', '25,615', 'INFO', 'Checking Exceptions']\n", "['2020-07-29 09', '50', '25,616', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '50', '25,827', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '50', '25,889', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '50', '25,889', 'INFO', 'Declaring global variables']\n", 
"['2020-07-29 09', '50', '25,889', 'INFO', 'Copying data for preprocessing']\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "['2020-07-29 09', '50', '25,902', 'INFO', 'Declaring preprocessing parameters']\n", "['2020-07-29 09', '50', '25,902', 'INFO', 'Importing preprocessing module']\n", "['2020-07-29 09', '50', '27,230', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '27,237', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '27,237', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '27,252', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '50', '27,271', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '29,232', 'INFO', 'Creating preprocessing pipeline']\n", "['2020-07-29 09', '50', '31,016', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '31,022', 'INFO', 'No inverse transformer found']\n", "['2020-07-29 09', '50', '31,022', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '31,035', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '50', '31,036', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '50', '31,082', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '50', '31,207', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '50', '31,207', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '50', '31,207', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '50', '31,207', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '50', '31,227', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '50', '31,240', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", 
"[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "['verbose=False), , None]']\n", "['2020-07-29 09', '50', '31,240', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '31,240', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '50', '31,614', 'INFO', 'Finalizing top_n models']\n", "['2020-07-29 09', '50', '31,615', 'INFO', 'SubProcess create_model() called ==================================']\n", "['2020-07-29 09', '50', '31,630', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '50', '31,630', 'INFO', 'create_model(estimator=gbr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", "['2020-07-29 09', '50', '31,630', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '50', '31,630', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '50', '31,631', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '50', '31,652', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '50', '31,653', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '50', '31,655', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '50', '31,655', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '50', '31,656', 'INFO', 'Gradient Boosting Regressor Imported succesfully']\n", 
"['2020-07-29 09', '50', '31,657', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', '50', '31,659', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '50', '31,662', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '31,827', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '31,831', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '31,832', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '31,846', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '50', '31,848', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '32,015', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '32,017', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '32,018', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '32,029', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '50', '32,031', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '32,183', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '32,187', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '32,187', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '32,198', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '50', '32,201', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '32,348', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '32,351', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '32,352', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '32,362', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '50', '32,364', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '32,528', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '32,532', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '32,532', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '32,544', 'INFO', 'Initializing Fold 6']\n", "['2020-07-29 09', '50', '32,547', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '32,700', 'INFO', 'Evaluating 
Metrics']\n", "['2020-07-29 09', '50', '32,704', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '32,704', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '32,714', 'INFO', 'Initializing Fold 7']\n", "['2020-07-29 09', '50', '32,716', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '32,866', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '32,869', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '32,869', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '32,881', 'INFO', 'Initializing Fold 8']\n", "['2020-07-29 09', '50', '32,885', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '33,045', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '33,049', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '33,050', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '33,061', 'INFO', 'Initializing Fold 9']\n", "['2020-07-29 09', '50', '33,064', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '33,222', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '33,225', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '33,226', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '33,235', 'INFO', 'Initializing Fold 10']\n", "['2020-07-29 09', '50', '33,237', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '33,386', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '33,389', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '33,389', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '33,399', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '50', '33,400', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '50', '33,408', 'INFO', 'Finalizing model']\n", "['2020-07-29 09', '50', '33,570', 'INFO', 'Uploading results into container']\n", "['2020-07-29 09', '50', '33,570', 'INFO', 'Uploading model into container']\n", "['2020-07-29 09', '50', '33,570', 'INFO', 'create_model_container', 
'1']\n", "['2020-07-29 09', '50', '33,571', 'INFO', 'master_model_container', '1']\n", "['2020-07-29 09', '50', '33,571', 'INFO', 'display_container', '1']\n", "['2020-07-29 09', '50', '33,572', 'INFO', \"GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", "['max_features=None, max_leaf_nodes=None,']\n", "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", "['min_samples_leaf=1, min_samples_split=2,']\n", "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", "[\"n_iter_no_change=None, presort='deprecated',\"]\n", "['random_state=123, subsample=1.0, tol=0.0001,']\n", "['validation_fraction=0.1, verbose=0, warm_start=False)']\n", "['2020-07-29 09', '50', '33,572', 'INFO', 'create_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '33,572', 'INFO', 'SubProcess create_model() end ==================================']\n", "['2020-07-29 09', '50', '33,736', 'INFO', 'create_model_container', '1']\n", "['2020-07-29 09', '50', '33,736', 'INFO', 'master_model_container', '1']\n", "['2020-07-29 09', '50', '33,736', 'INFO', 'display_container', '2']\n", "['2020-07-29 09', '50', '33,737', 'INFO', \"GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", "['max_features=None, max_leaf_nodes=None,']\n", "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", "['min_samples_leaf=1, min_samples_split=2,']\n", "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", "[\"n_iter_no_change=None, presort='deprecated',\"]\n", "['random_state=123, subsample=1.0, tol=0.0001,']\n", "['validation_fraction=0.1, verbose=0, warm_start=False)']\n", "['2020-07-29 09', '50', '33,737', 'INFO', 'compare_models() succesfully completed......................................']\n", "['2020-07-29 09', '50', '38,592', 'INFO', 'Initializing 
create_model()']\n", "['2020-07-29 09', '50', '38,593', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", "['2020-07-29 09', '50', '38,593', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '50', '38,593', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '50', '38,593', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '50', '38,629', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '50', '38,630', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '50', '38,631', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '50', '38,631', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '50', '38,639', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", "['2020-07-29 09', '50', '38,640', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', '50', '38,647', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '50', '38,656', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '38,849', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '38,857', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '38,857', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '38,908', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '50', '38,925', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '39,151', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '39,159', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '39,159', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '39,219', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '50', '39,239', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '39,508', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '39,518', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '39,518', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '39,580', 'INFO', 'Initializing Fold 4']\n", 
"['2020-07-29 09', '50', '39,603', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '39,908', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '39,919', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '39,920', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '39,994', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '50', '40,018', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '40,307', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '40,315', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '40,316', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '40,402', 'INFO', 'Initializing Fold 6']\n", "['2020-07-29 09', '50', '40,424', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '40,753', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '40,763', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '40,764', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '40,860', 'INFO', 'Initializing Fold 7']\n", "['2020-07-29 09', '50', '40,885', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '41,203', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '41,212', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '41,213', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '41,289', 'INFO', 'Initializing Fold 8']\n", "['2020-07-29 09', '50', '41,312', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '41,654', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '41,665', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '41,665', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '41,742', 'INFO', 'Initializing Fold 9']\n", "['2020-07-29 09', '50', '41,764', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '42,039', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '42,049', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '42,050', 'INFO', 'Compiling 
Metrics']\n", "['2020-07-29 09', '50', '42,129', 'INFO', 'Initializing Fold 10']\n", "['2020-07-29 09', '50', '42,151', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '42,228', 'INFO', 'Preprocessing pipeline created successfully']\n", "['2020-07-29 09', '50', '42,228', 'INFO', 'Creating grid variables']\n", "['2020-07-29 09', '50', '42,233', 'INFO', 'Creating global containers']\n", "['2020-07-29 09', '50', '42,511', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '42,521', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '42,521', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '42,601', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '50', '42,606', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '50', '42,633', 'INFO', 'Finalizing model']\n", "['2020-07-29 09', '50', '42,983', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '50', '43,314', 'INFO', 'Logging experiment in MLFlow']\n", "['2020-07-29 09', '50', '43,501', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '50', '43,502', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '50', '43,503', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '50', '43,504', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '50', '43,542', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '50', '43,572', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", 
"['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", "['2020-07-29 09', '50', '43,573', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '43,573', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '50', '43,664', 'INFO', 'Uploading results into container']\n", "['2020-07-29 09', '50', '43,664', 'INFO', 'Uploading model into container']\n", "['2020-07-29 09', '50', '43,819', 'INFO', 'create_model_container', '2']\n", "['2020-07-29 09', '50', '43,819', 'INFO', 'master_model_container', '2']\n", "['2020-07-29 09', '50', '43,819', 'INFO', 'display_container', '3']\n", 
"['2020-07-29 09', '50', '43,821', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", "['2020-07-29 09', '50', '43,821', 'INFO', 'create_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '43,841', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '50', '43,842', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=True)']\n", "['2020-07-29 09', '50', '43,842', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '50', '43,843', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '50', '43,843', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '50', '43,885', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '50', '43,886', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '50', '43,889', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '50', '43,889', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '50', '43,890', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", "['2020-07-29 09', '50', '43,893', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', '50', '43,895', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '50', '43,901', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '44,135', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '50', '44,136', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '50', '44,171', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", 
"['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", "['2020-07-29 09', '50', '44,172', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '50', '44,203', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", "['2020-07-29 09', '50', '44,258', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", 
"[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False), Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False)]']\n", "['2020-07-29 09', '50', '44,258', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '44,259', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '50', '44,437', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '44,448', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '44,448', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '44,477', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '50', '44,483', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '44,521', 'INFO', 'Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", 
"['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "['verbose=False)']\n", "['2020-07-29 09', '50', '44,521', 'INFO', 'setup() succesfully completed......................................']\n", "['2020-07-29 09', '50', '44,623', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '50', '44,624', 'INFO', 'create_model(model=kmeans, num_clusters=4, ground_truth=None, verbose=True, system=True)']\n", "['2020-07-29 09', '50', '44,625', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '50', '44,625', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '50', '44,625', 'INFO', 'Setting num_cluster param']\n", "['2020-07-29 09', '50', '44,626', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '50', '44,690', 'INFO', 'Importing untrained model']\n", "['2020-07-29 09', '50', '44,690', 'INFO', 'K-Means Clustering Imported succesfully']\n", "['2020-07-29 09', '50', '44,711', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '44,901', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '44,946', 'INFO', 'Creating Metrics dataframe']\n", "['2020-07-29 09', '50', '44,956', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '50', 
'45,024', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '45,037', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '45,038', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '45,068', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '50', '45,074', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '45,271', 'INFO', 'SubProcess plot_model() called ==================================']\n", "['2020-07-29 09', '50', '45,271', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '50', '45,273', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '50', '45,273', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '50', '45,273', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '50', '45,551', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '45,564', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '45,565', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '45,597', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '50', '45,608', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '46,101', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '46,111', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '46,112', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '46,140', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '50', '46,145', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '46,487', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '46,498', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '46,499', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '46,530', 'INFO', 'Initializing Fold 6']\n", "['2020-07-29 09', '50', 
'46,538', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '46,999', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '47,011', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '47,011', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '47,042', 'INFO', 'Initializing Fold 7']\n", "['2020-07-29 09', '50', '47,047', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '47,395', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '47,408', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '47,408', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '47,437', 'INFO', 'Initializing Fold 8']\n", "['2020-07-29 09', '50', '47,442', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '47,856', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '47,866', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '47,867', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '47,897', 'INFO', 'Initializing Fold 9']\n", "['2020-07-29 09', '50', '47,905', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '48,279', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '48,290', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '48,291', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '48,325', 'INFO', 'Initializing Fold 10']\n", "['2020-07-29 09', '50', '48,330', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '48,701', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '48,712', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '48,713', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '48,743', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '50', '48,748', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '50', '48,768', 'INFO', 'Finalizing model']\n", "['2020-07-29 09', '50', '49,134', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '50', '49,651', 'INFO', 'SubProcess save_model() 
called ==================================']\n", "['2020-07-29 09', '50', '49,651', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '50', '49,652', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '50', '49,653', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '50', '49,697', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '50', '49,727', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, 
max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", "['2020-07-29 09', '50', '49,728', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '49,728', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '50', '49,815', 'INFO', 'Uploading results into container']\n", "['2020-07-29 09', '50', '49,815', 'INFO', 'Uploading model into container']\n", "['2020-07-29 09', '50', '49,815', 'INFO', 'create_model_container', '3']\n", "['2020-07-29 09', '50', '49,815', 'INFO', 'master_model_container', '3']\n", "['2020-07-29 09', '50', '49,815', 'INFO', 'display_container', '4']\n", "['2020-07-29 09', '50', '49,817', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", "['2020-07-29 09', '50', '49,817', 'INFO', 'create_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '49,818', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '50', '49,818', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=True)']\n", "['2020-07-29 09', '50', '49,818', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '50', '49,818', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '50', '49,819', 'INFO', 'Preparing 
display monitor']\n", "['2020-07-29 09', '50', '49,851', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '50', '49,852', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '50', '49,855', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '50', '49,855', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '50', '49,857', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", "['2020-07-29 09', '50', '49,860', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', '50', '49,862', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '50', '49,868', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '50,229', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '50,237', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '50,238', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '50,268', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '50', '50,273', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '50,640', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '50,650', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '50,650', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '50,680', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '50', '50,687', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '51,379', 'INFO', 'plot type', 'cluster']\n", "['2020-07-29 09', '50', '51,379', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '50', '51,379', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '50', '51,381', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", "['2020-07-29 09', '50', '51,381', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '50', '51,382', 
'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '50', '51,382', 'INFO', 'Copying data']\n", "['2020-07-29 09', '50', '51,383', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", "['2020-07-29 09', '50', '51,383', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '50', '51,441', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '50', '51,443', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '50', '51,443', 'INFO', '(224, 21)']\n", "['2020-07-29 09', '50', '51,444', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '51,444', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '50', '51,481', 'INFO', 'Fitting PCA()']\n", "['2020-07-29 09', '50', '51,501', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '50', '51,510', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '50', '51,800', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '51,811', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '51,811', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '51,840', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '50', '51,855', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '52,980', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '52,992', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '52,993', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '53,024', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '50', '53,029', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '53,902', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '53,914', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '53,914', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '53,950', 'INFO', 'Initializing Fold 6']\n", "['2020-07-29 09', '50', '53,955', 'INFO', 
'Fitting Model']\n", "['2020-07-29 09', '50', '54,501', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '54,512', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '54,512', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '54,544', 'INFO', 'Initializing Fold 7']\n", "['2020-07-29 09', '50', '54,549', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '55,374', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '55,384', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '55,384', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '55,410', 'INFO', 'Initializing Fold 8']\n", "['2020-07-29 09', '50', '55,415', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '55,458', 'INFO', 'PyCaret NLP Module']\n", "['2020-07-29 09', '50', '55,459', 'INFO', 'version pycaret-nightly-0.39']\n", "['2020-07-29 09', '50', '55,459', 'INFO', 'Initializing setup()']\n", "['2020-07-29 09', '50', '55,460', 'INFO', 'USI', '2c3d']\n", "['2020-07-29 09', '50', '55,460', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=True, session_id=123, log_experiment=True,']\n", "['experiment_name=kiva1, log_plots=True, log_data=False, verbose=True)']\n", "['2020-07-29 09', '50', '55,460', 'INFO', 'Checking environment']\n", "['2020-07-29 09', '50', '55,461', 'INFO', 'python_version', '3.6.10']\n", "['2020-07-29 09', '50', '55,461', 'INFO', 'python_build', \"('default', 'May 7 2020 19\", '46', \"08')\"]\n", "['2020-07-29 09', '50', '55,461', 'INFO', 'machine', 'AMD64']\n", "['2020-07-29 09', '50', '55,462', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", "['2020-07-29 09', '50', '55,546', 'INFO', 'Memory', 'svmem(total=17032478720, available=4700733440, percent=72.4, used=12331745280, free=4700733440)']\n", "['2020-07-29 09', '50', '55,546', 'INFO', 'Physical Core', '4']\n", "['2020-07-29 09', '50', '55,547', 'INFO', 'Logical Core', '8']\n", "['2020-07-29 09', '50', '55,547', 'INFO', 'Checking 
libraries']\n", "['2020-07-29 09', '50', '55,547', 'INFO', 'pd==1.0.4']\n", "['2020-07-29 09', '50', '55,547', 'INFO', 'numpy==1.18.5']\n", "['2020-07-29 09', '50', '55,982', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '55,993', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '55,993', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '56,032', 'INFO', 'Initializing Fold 9']\n", "['2020-07-29 09', '50', '56,038', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '56,505', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '56,516', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '56,516', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '56,545', 'INFO', 'Initializing Fold 10']\n", "['2020-07-29 09', '50', '56,551', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '57,714', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '50', '57,725', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '50', '57,725', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '50', '57,754', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '50', '57,759', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '50', '57,779', 'INFO', 'Finalizing model']\n", "['2020-07-29 09', '50', '58,308', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '50', '58,410', 'INFO', 'gensim==3.8.3']\n", "['2020-07-29 09', '50', '58,896', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '50', '58,897', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '50', '58,899', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, 
reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '50', '58,899', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '50', '58,945', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '50', '58,978', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", "['2020-07-29 09', '50', '58,978', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '58,979', 'INFO', 'SubProcess save_model() end 
==================================']\n", "['2020-07-29 09', '50', '59,072', 'INFO', 'Uploading results into container']\n", "['2020-07-29 09', '50', '59,072', 'INFO', 'Uploading model into container']\n", "['2020-07-29 09', '50', '59,072', 'INFO', 'create_model_container', '4']\n", "['2020-07-29 09', '50', '59,072', 'INFO', 'master_model_container', '4']\n", "['2020-07-29 09', '50', '59,073', 'INFO', 'display_container', '5']\n", "['2020-07-29 09', '50', '59,074', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", "['2020-07-29 09', '50', '59,075', 'INFO', 'create_model() succesfully completed......................................']\n", "['2020-07-29 09', '50', '59,075', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '50', '59,075', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=True)']\n", "['2020-07-29 09', '50', '59,076', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '50', '59,076', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '50', '59,076', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '50', '59,110', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '50', '59,112', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '50', '59,115', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '50', '59,115', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '50', '59,116', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", "['2020-07-29 09', '50', '59,120', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', 
'50', '59,122', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '50', '59,129', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '50', '59,817', 'INFO', 'spacy==2.2.4']\n", "['2020-07-29 09', '51', '00,027', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '00,037', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '00,037', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '00,072', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '51', '00,081', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '00,692', 'INFO', \"Saving 'Cluster.html' in current active directory\"]\n", "['2020-07-29 09', '51', '00,692', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '00,692', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '00,907', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '00,919', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '00,919', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '00,948', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '51', '00,954', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '01,313', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '01,323', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '01,323', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '01,349', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '51', '01,354', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '01,554', 'INFO', 'nltk==3.5']\n", "['2020-07-29 09', '51', '01,706', 'INFO', 'textblob==0.15.3']\n", "['2020-07-29 09', '51', '01,774', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '01,783', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '01,783', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '01,814', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '51', '01,819', 'INFO', 'Fitting Model']\n", 
"['2020-07-29 09', '51', '02,155', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '02,165', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '02,165', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '02,189', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '02,190', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=distribution, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '51', '02,191', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '02,191', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '02,194', 'INFO', 'Initializing Fold 6']\n", "['2020-07-29 09', '51', '02,200', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '02,220', 'INFO', 'plot type', 'distribution']\n", "['2020-07-29 09', '51', '02,221', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '51', '02,221', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '51', '02,223', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=False, verbose=False)']\n", "['2020-07-29 09', '51', '02,224', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '02,224', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '02,224', 'INFO', 'Copying data']\n", "['2020-07-29 09', '51', '02,225', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '02,271', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '51', '02,273', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '51', '02,274', 'INFO', '(224, 22)']\n", 
"['2020-07-29 09', '51', '02,274', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '02,274', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '51', '02,275', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '51', '02,294', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '51', '02,690', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '02,701', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '02,701', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '02,728', 'INFO', 'Initializing Fold 7']\n", "['2020-07-29 09', '51', '02,734', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '03,122', 'INFO', \"Saving 'Distribution.html' in current active directory\"]\n", "['2020-07-29 09', '51', '03,122', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '03,122', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '03,236', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '03,240', 'INFO', 'pyLDAvis==2.1.2']\n", "['2020-07-29 09', '51', '03,244', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '03,244', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '03,273', 'INFO', 'Initializing Fold 8']\n", "['2020-07-29 09', '51', '03,278', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '03,482', 'INFO', 'wordcloud==1.7.0']\n", "['2020-07-29 09', '51', '03,624', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '03,636', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '03,637', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '03,663', 'INFO', 'Initializing Fold 9']\n", "['2020-07-29 09', '51', '03,668', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '03,979', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '03,989', 'INFO', 'No inverse 
transformation']\n", "['2020-07-29 09', '51', '03,989', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '04,017', 'INFO', 'Initializing Fold 10']\n", "['2020-07-29 09', '51', '04,023', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '04,361', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '04,371', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '04,372', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '04,400', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '51', '04,406', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '51', '04,424', 'INFO', 'Finalizing model']\n", "['2020-07-29 09', '51', '04,475', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '04,477', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=elbow, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '51', '04,477', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '04,477', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '04,503', 'INFO', 'plot type', 'elbow']\n", "['2020-07-29 09', '51', '04,642', 'INFO', 'Fitting KElbowVisualizer()']\n", "['2020-07-29 09', '51', '04,861', 'INFO', 'Creating MLFlow logs']\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "['2020-07-29 09', '51', '05,101', 'INFO', 'mlflow==1.8.0']\n", "['2020-07-29 09', '51', '05,102', 'INFO', 'Checking Exceptions']\n", "['2020-07-29 09', '51', '05,449', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '51', '05,450', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '51', '05,452', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', 
learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '51', '05,452', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '51', '05,498', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '51', '05,521', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), 
None]']\n", "['2020-07-29 09', '51', '05,522', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '05,522', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '51', '05,602', 'INFO', 'Uploading results into container']\n", "['2020-07-29 09', '51', '05,602', 'INFO', 'Uploading model into container']\n", "['2020-07-29 09', '51', '05,602', 'INFO', 'create_model_container', '5']\n", "['2020-07-29 09', '51', '05,603', 'INFO', 'master_model_container', '5']\n", "['2020-07-29 09', '51', '05,603', 'INFO', 'display_container', '6']\n", "['2020-07-29 09', '51', '05,605', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", "['2020-07-29 09', '51', '05,606', 'INFO', 'create_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '05,606', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '51', '05,606', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=True)']\n", "['2020-07-29 09', '51', '05,607', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '05,607', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '05,607', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '05,637', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '51', '05,638', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '05,641', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '51', '05,641', 'INFO', 'Declaring metric 
variables']\n", "['2020-07-29 09', '51', '05,642', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", "['2020-07-29 09', '51', '05,643', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', '51', '05,645', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '51', '05,651', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '05,963', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '05,971', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '05,971', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '05,997', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '51', '06,002', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '06,313', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '06,321', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '06,322', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '06,345', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '51', '06,349', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '06,432', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '51', '06,700', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '06,708', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '06,709', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '06,740', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '51', '06,744', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '07,071', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '07,080', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '07,080', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '07,101', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '51', '07,106', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '07,403', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '07,411', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '07,411', 'INFO', 'Compiling Metrics']\n", 
"['2020-07-29 09', '51', '07,438', 'INFO', 'Initializing Fold 6']\n", "['2020-07-29 09', '51', '07,443', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '07,767', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '07,781', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '07,782', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '07,808', 'INFO', 'Initializing Fold 7']\n", "['2020-07-29 09', '51', '07,813', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '08,123', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '08,170', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '08,179', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '08,180', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '08,189', 'INFO', \"Saving 'Elbow.png' in current active directory\"]\n", "['2020-07-29 09', '51', '08,189', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '08,189', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '08,207', 'INFO', 'Initializing Fold 8']\n", "['2020-07-29 09', '51', '08,211', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '08,234', 'INFO', 'SubProcess plot_model() end ==================================']\n", "['2020-07-29 09', '51', '08,234', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '51', '08,234', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '51', '08,236', 'INFO', \"save_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '51', '08,236', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '51', '08,262', 'INFO', 'Trained Model.pkl saved in current working directory']\n", 
"['2020-07-29 09', '51', '08,273', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '08,285', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "[\"verbose=False), KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0)]']\n", "['2020-07-29 09', '51', '08,285', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '08,285', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '51', '08,344', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '08,344', 'INFO', 'Declaring global variables']\n", "['2020-07-29 09', '51', '08,345', 'INFO', 'Input provided', 'dataframe']\n", "['2020-07-29 09', '51', '08,345', 'INFO', 'session_id set to', '123']\n", "['2020-07-29 09', '51', '08,347', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '51', '08,351', 'INFO', 'Importing 
stopwords from nltk']\n", "['2020-07-29 09', '51', '08,398', 'INFO', \"KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0)']\n", "['2020-07-29 09', '51', '08,399', 'INFO', 'create_models() succesfully completed......................................']\n", "['2020-07-29 09', '51', '08,419', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '51', '08,419', 'INFO', 'create_model(model=kmodes, num_clusters=4, ground_truth=None, verbose=True, system=True)']\n", "['2020-07-29 09', '51', '08,419', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '08,420', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '08,421', 'INFO', 'Setting num_cluster param']\n", "['2020-07-29 09', '51', '08,421', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '08,484', 'INFO', 'Importing untrained model']\n", "['2020-07-29 09', '51', '08,493', 'INFO', 'K-Modes Clustering Imported succesfully']\n", "['2020-07-29 09', '51', '08,516', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '08,689', 'INFO', 'No custom stopwords defined']\n", "['2020-07-29 09', '51', '08,692', 'INFO', 'Removing numeric characters from the text']\n", "['2020-07-29 09', '51', '10,128', 'INFO', 'Removing special characters from the text']\n", "['2020-07-29 09', '51', '14,072', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '14,083', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '14,083', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '14,112', 'INFO', 'Initializing Fold 9']\n", "['2020-07-29 09', '51', '14,120', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '14,712', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '14,721', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '14,722', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', 
'14,747', 'INFO', 'Initializing Fold 10']\n", "['2020-07-29 09', '51', '14,751', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '15,185', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '15,195', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '15,196', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '15,225', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '51', '15,233', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '51', '15,250', 'INFO', 'Finalizing model']\n", "['2020-07-29 09', '51', '15,429', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '15,460', 'INFO', 'Creating Metrics dataframe']\n", "['2020-07-29 09', '51', '15,467', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '51', '15,686', 'INFO', 'SubProcess plot_model() called ==================================']\n", "['2020-07-29 09', '51', '15,687', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '15,687', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0), plot=cluster, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '51', '15,687', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '15,687', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '15,712', 'INFO', 'plot type', 'cluster']\n", "['2020-07-29 09', '51', '15,712', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '51', '15,712', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '51', '15,714', 'INFO', \"assign_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0), transformation=True, verbose=False)']\n", "['2020-07-29 09', '51', '15,714', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '15,714', 'INFO', 'Preloading libraries']\n", 
"['2020-07-29 09', '51', '15,714', 'INFO', 'Copying data']\n", "['2020-07-29 09', '51', '15,715', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", "['2020-07-29 09', '51', '15,715', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '15,750', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '51', '15,751', 'INFO', 'Trained Model', 'K-Modes Clustering']\n", "['2020-07-29 09', '51', '15,752', 'INFO', '(224, 21)']\n", "['2020-07-29 09', '51', '15,752', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '15,753', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '51', '15,768', 'INFO', 'Fitting PCA()']\n", "['2020-07-29 09', '51', '15,785', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '51', '15,791', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '51', '15,848', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '51', '16,197', 'INFO', \"Saving 'Cluster.html' in current active directory\"]\n", "['2020-07-29 09', '51', '16,197', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '16,198', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '16,439', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '51', '16,439', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '51', '16,441', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), 
model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '51', '16,441', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '51', '16,481', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '51', '16,508', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", "['2020-07-29 09', '51', '16,508', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '16,508', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '51', '16,609', 'INFO', 'Uploading results into 
container']\n", "['2020-07-29 09', '51', '16,609', 'INFO', 'Uploading model into container']\n", "['2020-07-29 09', '51', '16,610', 'INFO', 'create_model_container', '6']\n", "['2020-07-29 09', '51', '16,610', 'INFO', 'master_model_container', '6']\n", "['2020-07-29 09', '51', '16,610', 'INFO', 'display_container', '7']\n", "['2020-07-29 09', '51', '16,612', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", "['2020-07-29 09', '51', '16,612', 'INFO', 'create_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '16,613', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '51', '16,613', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=True)']\n", "['2020-07-29 09', '51', '16,613', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '16,613', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '16,613', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '16,641', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '51', '16,642', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '16,644', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '51', '16,645', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '51', '16,646', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", "['2020-07-29 09', '51', '16,648', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', '51', '16,650', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '51', '16,655', 'INFO', 'Fitting 
Model']\n", "['2020-07-29 09', '51', '16,986', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '16,996', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '16,996', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '17,026', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '51', '17,032', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '17,396', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '17,407', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '17,407', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '17,433', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '51', '17,438', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '17,523', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '17,525', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0), plot=distribution, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '51', '17,525', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '17,525', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '17,550', 'INFO', 'plot type', 'distribution']\n", "['2020-07-29 09', '51', '17,550', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '51', '17,551', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '51', '17,552', 'INFO', \"assign_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0), transformation=False, verbose=False)']\n", "['2020-07-29 09', '51', '17,553', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '17,553', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '17,553', 'INFO', 'Copying data']\n", "['2020-07-29 09', '51', '17,554', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', 
'51', '17,595', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '51', '17,597', 'INFO', 'Trained Model', 'K-Modes Clustering']\n", "['2020-07-29 09', '51', '17,597', 'INFO', '(224, 22)']\n", "['2020-07-29 09', '51', '17,597', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '17,598', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '51', '17,598', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '51', '17,611', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '51', '17,786', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '17,795', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '17,795', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '17,822', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '51', '17,828', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '18,047', 'INFO', 'Tokenizing Words']\n", "['2020-07-29 09', '51', '18,251', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '18,259', 'INFO', \"Saving 'Distribution.html' in current active directory\"]\n", "['2020-07-29 09', '51', '18,259', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '18,259', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '18,259', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '18,261', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '18,286', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '51', '18,290', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '18,650', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '18,657', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '18,658', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '18,680', 'INFO', 'Initializing Fold 6']\n", "['2020-07-29 09', '51', '18,685', 'INFO', 'Fitting Model']\n", 
"['2020-07-29 09', '51', '19,010', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '19,019', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '19,019', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '19,041', 'INFO', 'Initializing Fold 7']\n", "['2020-07-29 09', '51', '19,046', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '19,353', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '19,361', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '19,361', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '19,383', 'INFO', 'Initializing Fold 8']\n", "['2020-07-29 09', '51', '19,387', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '19,654', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '19,655', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0), plot=elbow, feature=None, label=False, save=True, system=False)']\n", "['2020-07-29 09', '51', '19,656', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '19,656', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '19,680', 'INFO', 'plot type', 'elbow']\n", "['2020-07-29 09', '51', '19,722', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '19,743', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '19,744', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '19,776', 'INFO', 'Fitting KElbowVisualizer()']\n", "['2020-07-29 09', '51', '19,780', 'INFO', 'Initializing Fold 9']\n", "['2020-07-29 09', '51', '19,789', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '20,182', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '20,190', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '20,191', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '20,218', 'INFO', 'Initializing Fold 10']\n", "['2020-07-29 09', '51', '20,223', 'INFO', 
'Fitting Model']\n", "['2020-07-29 09', '51', '20,568', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '20,579', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '20,579', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '20,608', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '51', '20,614', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '51', '20,633', 'INFO', 'Finalizing model']\n", "['2020-07-29 09', '51', '20,990', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '51', '21,496', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '51', '21,496', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '51', '21,498', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '51', '21,498', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '51', '21,545', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '51', '21,572', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), 
('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", "['2020-07-29 09', '51', '21,572', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '21,572', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '51', '21,660', 'INFO', 'Uploading results into container']\n", "['2020-07-29 09', '51', '21,660', 'INFO', 'Uploading model into container']\n", "['2020-07-29 09', '51', '21,660', 'INFO', 'create_model_container', '7']\n", "['2020-07-29 09', '51', '21,661', 'INFO', 'master_model_container', '7']\n", "['2020-07-29 09', '51', '21,661', 'INFO', 'display_container', '8']\n", "['2020-07-29 09', '51', '21,663', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, 
subsample_freq=0)']\n", "['2020-07-29 09', '51', '21,663', 'INFO', 'create_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '21,664', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '51', '21,664', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=True)']\n", "['2020-07-29 09', '51', '21,664', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '21,664', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '21,664', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '21,704', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '51', '21,705', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '21,707', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '51', '21,707', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '51', '21,708', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", "['2020-07-29 09', '51', '21,711', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', '51', '21,714', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '51', '21,719', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '22,073', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '22,082', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '22,082', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '22,110', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '51', '22,114', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '22,485', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '22,494', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '22,495', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '22,521', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '51', '22,526', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '22,854', 'INFO', 'Evaluating Metrics']\n", 
"['2020-07-29 09', '51', '22,863', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '22,863', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '22,886', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '51', '22,892', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '23,201', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '23,209', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '23,209', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '23,234', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '51', '23,239', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '23,566', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '23,577', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '23,578', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '23,604', 'INFO', 'Initializing Fold 6']\n", "['2020-07-29 09', '51', '23,609', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '24,001', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '24,010', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '24,011', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '24,039', 'INFO', 'Initializing Fold 7']\n", "['2020-07-29 09', '51', '24,045', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '24,458', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '24,469', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '24,470', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '24,497', 'INFO', 'Initializing Fold 8']\n", "['2020-07-29 09', '51', '24,502', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '24,843', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '24,854', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '24,855', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '24,878', 'INFO', 'Initializing Fold 9']\n", "['2020-07-29 09', '51', '24,883', 'INFO', 
'Fitting Model']\n", "['2020-07-29 09', '51', '25,229', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '25,237', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '25,238', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '25,260', 'INFO', 'Initializing Fold 10']\n", "['2020-07-29 09', '51', '25,264', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '25,610', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '25,619', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '25,620', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '25,649', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '51', '25,654', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '51', '25,676', 'INFO', 'Finalizing model']\n", "['2020-07-29 09', '51', '26,031', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '51', '26,558', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '51', '26,558', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '51', '26,560', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '51', '26,561', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '51', '26,610', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '51', '26,641', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", 
"[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", "['2020-07-29 09', '51', '26,641', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '26,641', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '51', '26,727', 'INFO', 'Uploading results into container']\n", "['2020-07-29 09', '51', '26,728', 'INFO', 'Uploading model into container']\n", "['2020-07-29 09', '51', '26,728', 'INFO', 'create_model_container', '8']\n", "['2020-07-29 09', '51', '26,728', 'INFO', 'master_model_container', '8']\n", "['2020-07-29 09', '51', '26,728', 'INFO', 'display_container', '9']\n", "['2020-07-29 09', '51', '26,729', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, 
colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", "['2020-07-29 09', '51', '26,729', 'INFO', 'create_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '26,730', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '51', '26,730', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=True)']\n", "['2020-07-29 09', '51', '26,730', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '26,730', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '26,730', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '26,757', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '51', '26,758', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '26,761', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '51', '26,761', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '51', '26,762', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", "['2020-07-29 09', '51', '26,765', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', '51', '26,767', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '51', '26,772', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '27,137', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '27,145', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '27,146', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '27,180', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '51', '27,185', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '27,525', 'INFO', 'Evaluating Metrics']\n", 
"['2020-07-29 09', '51', '27,537', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '27,537', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '27,568', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '51', '27,574', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '27,918', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '27,927', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '27,927', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '27,957', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '51', '27,964', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '28,283', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '28,292', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '28,292', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '28,317', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '51', '28,323', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '28,657', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '28,666', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '28,667', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '28,694', 'INFO', 'Initializing Fold 6']\n", "['2020-07-29 09', '51', '28,698', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '29,025', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '29,033', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '29,033', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '29,060', 'INFO', 'Initializing Fold 7']\n", "['2020-07-29 09', '51', '29,064', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '29,407', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '29,418', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '29,418', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '29,447', 'INFO', 'Initializing Fold 8']\n", "['2020-07-29 09', '51', '29,454', 'INFO', 
'Fitting Model']\n", "['2020-07-29 09', '51', '29,799', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '29,810', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '29,810', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '29,839', 'INFO', 'Initializing Fold 9']\n", "['2020-07-29 09', '51', '29,845', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '30,163', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '30,170', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '30,171', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '30,197', 'INFO', 'Initializing Fold 10']\n", "['2020-07-29 09', '51', '30,202', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '30,523', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '30,533', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '30,533', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '30,559', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '51', '30,562', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '51', '30,580', 'INFO', 'Finalizing model']\n", "['2020-07-29 09', '51', '30,932', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '51', '31,478', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '51', '31,479', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '51', '31,481', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '51', '31,481', 'INFO', 
'Appending prep pipeline']\n", "['2020-07-29 09', '51', '31,512', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '51', '31,536', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", "['2020-07-29 09', '51', '31,536', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '31,536', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '51', '31,619', 'INFO', 'Uploading results into container']\n", "['2020-07-29 09', '51', '31,620', 'INFO', 'Uploading model into container']\n", 
"['2020-07-29 09', '51', '31,620', 'INFO', 'create_model_container', '9']\n", "['2020-07-29 09', '51', '31,620', 'INFO', 'master_model_container', '9']\n", "['2020-07-29 09', '51', '31,620', 'INFO', 'display_container', '10']\n", "['2020-07-29 09', '51', '31,622', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", "['2020-07-29 09', '51', '31,623', 'INFO', 'create_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '31,623', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '51', '31,624', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=True)']\n", "['2020-07-29 09', '51', '31,624', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '31,624', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '31,624', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '31,656', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '51', '31,658', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '31,660', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '51', '31,661', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '51', '31,662', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", "['2020-07-29 09', '51', '31,664', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', '51', '31,667', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '51', '31,672', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', 
'32,036', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '32,044', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '32,044', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '32,068', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '51', '32,073', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '32,380', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '32,391', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '32,391', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '32,418', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '51', '32,423', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '32,741', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '32,749', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '32,750', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '32,774', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '51', '32,779', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '33,089', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '33,096', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '33,096', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '33,122', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '51', '33,127', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '33,448', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '33,456', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '33,456', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '33,478', 'INFO', 'Initializing Fold 6']\n", "['2020-07-29 09', '51', '33,482', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '33,801', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '33,811', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '33,812', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '33,838', 'INFO', 'Initializing Fold 7']\n", 
"['2020-07-29 09', '51', '33,843', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '33,875', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '51', '34,159', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '34,168', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '34,168', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '34,193', 'INFO', 'Initializing Fold 8']\n", "['2020-07-29 09', '51', '34,198', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '34,434', 'INFO', \"Saving 'Elbow.png' in current active directory\"]\n", "['2020-07-29 09', '51', '34,435', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '34,435', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '34,471', 'INFO', 'SubProcess plot_model() end ==================================']\n", "['2020-07-29 09', '51', '34,472', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '51', '34,472', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '51', '34,473', 'INFO', \"save_model(model=KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '51', '34,473', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '51', '34,506', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '34,514', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '34,514', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '34,537', 'INFO', 'Initializing Fold 9']\n", "['2020-07-29 09', '51', '34,542', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '34,842', 'INFO', 'Removing stopwords']\n", "['2020-07-29 09', '51', '34,868', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '34,879', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '34,880', 
'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '34,904', 'INFO', 'Initializing Fold 10']\n", "['2020-07-29 09', '51', '34,909', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '35,141', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '51', '35,166', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "[\"verbose=False), KModes(cat_dissim=, init='Cao',\"]\n", "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0)]']\n", "['2020-07-29 09', '51', '35,166', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '35,167', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '51', '35,226', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '35,245', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '35,246', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '35,271', 'INFO', \"KModes(cat_dissim=, init='Cao',\"]\n", 
"['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", "['verbose=0)']\n", "['2020-07-29 09', '51', '35,272', 'INFO', 'create_models() succesfully completed......................................']\n", "['2020-07-29 09', '51', '35,275', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '51', '35,280', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '51', '35,295', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '51', '35,297', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=False, verbose=True)']\n", "['2020-07-29 09', '51', '35,297', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '35,298', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '35,298', 'INFO', 'Copying data']\n", "['2020-07-29 09', '51', '35,299', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '35,300', 'INFO', 'Finalizing model']\n", "['2020-07-29 09', '51', '35,373', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '51', '35,375', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '51', '35,378', 'INFO', '(224, 22)']\n", "['2020-07-29 09', '51', '35,378', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '35,468', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '35,470', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=None, label=False, save=False, system=True)']\n", "['2020-07-29 09', '51', '35,470', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '35,470', 'INFO', 'Importing 
libraries']\n", "['2020-07-29 09', '51', '35,494', 'INFO', 'plot type', 'cluster']\n", "['2020-07-29 09', '51', '35,494', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '51', '35,494', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '51', '35,496', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", "['2020-07-29 09', '51', '35,496', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '35,496', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '35,496', 'INFO', 'Copying data']\n", "['2020-07-29 09', '51', '35,497', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", "['2020-07-29 09', '51', '35,497', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '35,530', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '51', '35,532', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '51', '35,533', 'INFO', '(224, 21)']\n", "['2020-07-29 09', '51', '35,533', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '35,534', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '51', '35,549', 'INFO', 'Fitting PCA()']\n", "['2020-07-29 09', '51', '35,565', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '51', '35,570', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '51', '35,796', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '35,796', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '35,812', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '35,813', 'INFO', 
\"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=Country Name, label=True, save=False, system=True)']\n", "['2020-07-29 09', '51', '35,814', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '35,814', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '35,840', 'INFO', 'plot type', 'cluster']\n", "['2020-07-29 09', '51', '35,841', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '51', '35,841', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '51', '35,842', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", "['2020-07-29 09', '51', '35,842', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '35,843', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '35,843', 'INFO', 'Copying data']\n", "['2020-07-29 09', '51', '35,844', 'INFO', 'Transformation param set to True. 
Assigned clusters are attached on transformed dataset.']\n", "['2020-07-29 09', '51', '35,844', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '35,878', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '51', '35,880', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '51', '35,880', 'INFO', '(224, 21)']\n", "['2020-07-29 09', '51', '35,881', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '35,881', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '51', '35,897', 'INFO', 'Fitting PCA()']\n", "['2020-07-29 09', '51', '35,916', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '51', '35,923', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '51', '36,095', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '51', '36,190', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '36,190', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '36,205', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '36,206', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=tsne, feature=None, label=False, save=False, system=True)']\n", "['2020-07-29 09', '51', '36,207', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '36,207', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '36,240', 'INFO', 'plot type', 'tsne']\n", "['2020-07-29 09', '51', '36,240', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '51', '36,240', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '51', '36,242', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, 
init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", "['2020-07-29 09', '51', '36,242', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '36,243', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '36,243', 'INFO', 'Copying data']\n", "['2020-07-29 09', '51', '36,244', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", "['2020-07-29 09', '51', '36,244', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '36,287', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '51', '36,289', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '51', '36,289', 'INFO', '(224, 21)']\n", "['2020-07-29 09', '51', '36,290', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '36,290', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '51', '36,294', 'INFO', 'Fitting TSNE()']\n", "['2020-07-29 09', '51', '36,736', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '51', '36,737', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '51', '36,739', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '51', '36,739', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '51', '36,784', 
'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '51', '36,809', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", "['2020-07-29 09', '51', '36,809', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '36,810', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '51', '36,901', 'INFO', 'Uploading results into container']\n", "['2020-07-29 09', '51', '36,901', 'INFO', 'Uploading model into container']\n", "['2020-07-29 09', '51', '36,901', 'INFO', 'create_model_container', 
'10']\n", "['2020-07-29 09', '51', '36,901', 'INFO', 'master_model_container', '10']\n", "['2020-07-29 09', '51', '36,902', 'INFO', 'display_container', '11']\n", "['2020-07-29 09', '51', '36,903', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", "['2020-07-29 09', '51', '36,904', 'INFO', 'create_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '36,904', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '51', '36,904', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=True)']\n", "['2020-07-29 09', '51', '36,905', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '36,905', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '36,905', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '36,943', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '51', '36,944', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '36,947', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '51', '36,948', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '51', '36,949', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", "['2020-07-29 09', '51', '36,952', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', '51', '36,954', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '51', '36,958', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '37,684', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '37,692', 'INFO', 'No inverse transformation']\n", 
"['2020-07-29 09', '51', '37,692', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '37,716', 'INFO', 'Initializing Fold 2']\n", "['2020-07-29 09', '51', '37,721', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '38,429', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '38,437', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '38,437', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '38,460', 'INFO', 'Initializing Fold 3']\n", "['2020-07-29 09', '51', '38,464', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '39,178', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '39,186', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '39,186', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '39,210', 'INFO', 'Initializing Fold 4']\n", "['2020-07-29 09', '51', '39,215', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '39,960', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '39,968', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '39,968', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '39,992', 'INFO', 'Initializing Fold 5']\n", "['2020-07-29 09', '51', '39,997', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '40,712', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '40,720', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '40,720', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '40,743', 'INFO', 'Initializing Fold 6']\n", "['2020-07-29 09', '51', '40,748', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '41,445', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '41,454', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '41,454', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '41,478', 'INFO', 'Initializing Fold 7']\n", "['2020-07-29 09', '51', '41,483', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '41,653', 'INFO', 'Sorting 
dataframe']\n", "['2020-07-29 09', '51', '41,659', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '51', '41,956', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '41,965', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '41,965', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '41,967', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '41,967', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '41,981', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '41,982', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=elbow, feature=None, label=False, save=False, system=True)']\n", "['2020-07-29 09', '51', '41,983', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '41,984', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '41,994', 'INFO', 'Initializing Fold 8']\n", "['2020-07-29 09', '51', '41,997', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '42,027', 'INFO', 'plot type', 'elbow']\n", "['2020-07-29 09', '51', '42,028', 'INFO', 'Fitting KElbowVisualizer()']\n", "['2020-07-29 09', '51', '42,381', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '42,393', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '42,394', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '42,420', 'INFO', 'Initializing Fold 9']\n", "['2020-07-29 09', '51', '42,425', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '42,790', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '42,799', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '42,799', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '42,822', 'INFO', 'Initializing Fold 10']\n", "['2020-07-29 09', '51', '42,827', 
'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '43,263', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '43,283', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '43,284', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '43,307', 'INFO', 'Calculating mean and std']\n", "['2020-07-29 09', '51', '43,311', 'INFO', 'Creating metrics dataframe']\n", "['2020-07-29 09', '51', '43,331', 'INFO', 'Finalizing model']\n", "['2020-07-29 09', '51', '43,369', 'INFO', 'Extracting Bigrams']\n", "['2020-07-29 09', '51', '43,937', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '51', '43,967', 'INFO', 'Creating MLFlow logs']\n", "['2020-07-29 09', '51', '44,615', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '51', '44,615', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '51', '44,617', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", "['2020-07-29 09', '51', '44,618', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '51', '44,634', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '44,635', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '44,650', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '44,652', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, 
tol=0.0001, verbose=0), plot=silhouette, feature=None, label=False, save=False, system=True)']\n", "['2020-07-29 09', '51', '44,656', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '44,656', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '44,669', 'INFO', 'Trained Model.pkl saved in current working directory']\n", "['2020-07-29 09', '51', '44,688', 'INFO', 'plot type', 'silhouette']\n", "['2020-07-29 09', '51', '44,689', 'INFO', 'Fitting SilhouetteVisualizer()']\n", "['2020-07-29 09', '51', '44,701', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True, features_todrop=[],']\n", "[\"ml_usecase='regression',\"]\n", "[\"numerical_features=[], target='charges',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_Catagorical_Levels...']\n", "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", "['2020-07-29 09', '51', '44,701', 'INFO', 
'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '44,701', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '51', '44,794', 'INFO', 'Uploading results into container']\n", "['2020-07-29 09', '51', '44,794', 'INFO', 'Uploading model into container']\n", "['2020-07-29 09', '51', '44,795', 'INFO', 'create_model_container', '11']\n", "['2020-07-29 09', '51', '44,795', 'INFO', 'master_model_container', '11']\n", "['2020-07-29 09', '51', '44,795', 'INFO', 'display_container', '12']\n", "['2020-07-29 09', '51', '44,798', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", "['2020-07-29 09', '51', '44,798', 'INFO', 'create_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '44,800', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '51', '44,906', 'INFO', 'Initializing create_model()']\n", "['2020-07-29 09', '51', '44,908', 'INFO', \"create_model(estimator=ExplainableBoostingRegressor(binning='quantile', early_stopping_rounds=50,\"]\n", "['early_stopping_tolerance=0, feature_names=None,']\n", "['feature_types=None, inner_bags=0, interactions=0,']\n", "[\"learning_rate=0.01, mains='all', max_bins=255,\"]\n", "['max_leaves=3, max_rounds=5000, min_samples_leaf=2,']\n", "['n_jobs=-2, outer_bags=16, random_state=42,']\n", "['validation_size=0.15), ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", "['2020-07-29 09', '51', '44,909', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', 
'44,909', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '44,909', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '45,006', 'INFO', 'Copying training dataset']\n", "['2020-07-29 09', '51', '45,008', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '45,011', 'INFO', 'Defining folds']\n", "['2020-07-29 09', '51', '45,012', 'INFO', 'Declaring metric variables']\n", "['2020-07-29 09', '51', '45,033', 'INFO', 'Declaring custom model']\n", "['2020-07-29 09', '51', '45,035', 'INFO', 'ExplainableBoostingRegressor Imported succesfully']\n", "['2020-07-29 09', '51', '45,039', 'INFO', 'Checking ensemble method']\n", "['2020-07-29 09', '51', '45,060', 'INFO', 'Initializing Fold 1']\n", "['2020-07-29 09', '51', '45,083', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '45,326', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '45,327', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '45,342', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '45,344', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=distance, feature=None, label=False, save=False, system=True)']\n", "['2020-07-29 09', '51', '45,344', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '45,345', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '45,377', 'INFO', 'plot type', 'distance']\n", "['2020-07-29 09', '51', '45,487', 'INFO', 'Fitting InterclusterDistance()']\n", "['2020-07-29 09', '51', '45,564', 'INFO', 'Rendering Visual']\n", "['2020-07-29 09', '51', '46,194', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '46,194', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', 
'46,209', 'INFO', 'Initializing plot_model()']\n", "['2020-07-29 09', '51', '46,212', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), plot=distribution, feature=None, label=False, save=False, system=True)']\n", "['2020-07-29 09', '51', '46,212', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '46,213', 'INFO', 'Importing libraries']\n", "['2020-07-29 09', '51', '46,239', 'INFO', 'plot type', 'distribution']\n", "['2020-07-29 09', '51', '46,240', 'INFO', 'SubProcess assign_model() called ==================================']\n", "['2020-07-29 09', '51', '46,240', 'INFO', 'Initializing assign_model()']\n", "['2020-07-29 09', '51', '46,242', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), transformation=False, verbose=False)']\n", "['2020-07-29 09', '51', '46,242', 'INFO', 'Checking exceptions']\n", "['2020-07-29 09', '51', '46,243', 'INFO', 'Preloading libraries']\n", "['2020-07-29 09', '51', '46,243', 'INFO', 'Copying data']\n", "['2020-07-29 09', '51', '46,244', 'INFO', 'Preparing display monitor']\n", "['2020-07-29 09', '51', '46,295', 'INFO', 'Determining Trained Model']\n", "['2020-07-29 09', '51', '46,297', 'INFO', 'Trained Model', 'K-Means Clustering']\n", "['2020-07-29 09', '51', '46,297', 'INFO', '(224, 22)']\n", "['2020-07-29 09', '51', '46,297', 'INFO', 'assign_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '46,298', 'INFO', 'SubProcess assign_model() end ==================================']\n", "['2020-07-29 09', '51', '46,298', 'INFO', 'Sorting dataframe']\n", "['2020-07-29 09', '51', '46,312', 'INFO', 'Rendering Visual']\n", 
"['2020-07-29 09', '51', '46,914', 'INFO', 'Visual Rendered Successfully']\n", "['2020-07-29 09', '51', '46,914', 'INFO', 'plot_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '47,206', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '51', '47,208', 'INFO', \"save_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), model_name=kmeans, verbose=True)']\n", "['2020-07-29 09', '51', '47,209', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '51', '47,243', 'INFO', 'kmeans.pkl saved in current working directory']\n", "['2020-07-29 09', '51', '47,273', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", "[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "[\"verbose=False), KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, 
verbose=0)]']\n", "['2020-07-29 09', '51', '47,275', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '47,520', 'INFO', 'Initializing deploy_model()']\n", "['2020-07-29 09', '51', '47,522', 'INFO', \"deploy_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "[\"random_state=123, tol=0.0001, verbose=0), model_name=kmeans-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", "['2020-07-29 09', '51', '47,522', 'INFO', 'Platform', 'AWS S3']\n", "['2020-07-29 09', '51', '49,570', 'INFO', 'Saving model in current working directory']\n", "['2020-07-29 09', '51', '49,571', 'INFO', 'SubProcess save_model() called ==================================']\n", "['2020-07-29 09', '51', '49,571', 'INFO', 'Initializing save_model()']\n", "['2020-07-29 09', '51', '49,573', 'INFO', \"save_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0), model_name=kmeans-aws, verbose=False)']\n", "['2020-07-29 09', '51', '49,574', 'INFO', 'Appending prep pipeline']\n", "['2020-07-29 09', '51', '49,638', 'INFO', 'kmeans-aws.pkl saved in current working directory']\n", "['2020-07-29 09', '51', '49,661', 'INFO', '[Pipeline(memory=None,']\n", "[\"steps=[('dtypes',\"]\n", "['DataTypes_Auto_infer(categorical_features=[],']\n", "['display_types=True,']\n", "[\"features_todrop=['Country Name'],\"]\n", "[\"ml_usecase='regression',\"]\n", "['numerical_features=[],']\n", "[\"target='dummy_target',\"]\n", "['time_features=[])),']\n", "[\"('imputer',\"]\n", "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", "[\"numeric_strategy='mean',\"]\n", "['target_variable=None)),']\n", "[\"('new_levels1',\"]\n", "['New_...']\n", 
"[\"target='dummy_target')),\"]\n", "[\"('feature_time',\"]\n", "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", "[\"('group', Empty()), ('scaling', Empty()),\"]\n", "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", "[\"('dummy', Dummify(target='dummy_target')),\"]\n", "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", "[\"('pca', Empty())],\"]\n", "[\"verbose=False), KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0)]']\n", "['2020-07-29 09', '51', '49,661', 'INFO', 'save_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '49,661', 'INFO', 'SubProcess save_model() end ==================================']\n", "['2020-07-29 09', '51', '49,661', 'INFO', 'Initializing S3 client']\n", "['2020-07-29 09', '51', '51,288', 'INFO', 'Evaluating Metrics']\n", "['2020-07-29 09', '51', '51,296', 'INFO', 'No inverse transformation']\n", "['2020-07-29 09', '51', '51,296', 'INFO', 'Compiling Metrics']\n", "['2020-07-29 09', '51', '51,340', 'INFO', \"KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", "['random_state=123, tol=0.0001, verbose=0)']\n", "['2020-07-29 09', '51', '51,340', 'INFO', 'deploy_model() succesfully completed......................................']\n", "['2020-07-29 09', '51', '51,362', 'INFO', 'Initializing get_config()']\n", "['2020-07-29 09', '51', '51,363', 'INFO', 'get_config(variable=X)']\n", "['2020-07-29 09', '51', '51,363', 'INFO', 'Global variable', 'X returned']\n", "['2020-07-29 09', '51', '51,364', 'INFO', 'get_config() succesfully completed......................................']\n", "['2020-07-29 09', '51', '51,382', 'INFO', 
'Initializing Fold 2']\n", "['2020-07-29 09', '51', '51,410', 'INFO', 'Fitting Model']\n", "['2020-07-29 09', '51', '51,471', 'INFO', 'Initializing get_config()']\n", "['2020-07-29 09', '51', '51,472', 'INFO', 'get_config(variable=seed)']\n", "['2020-07-29 09', '51', '51,472', 'INFO', 'Global variable', 'seed returned']\n", "['2020-07-29 09', '51', '51,472', 'INFO', 'get_config() succesfully completed......................................']\n", "['2020-07-29 09', '51', '51,496', 'INFO', 'Initializing set_config()']\n", "['2020-07-29 09', '51', '51,496', 'INFO', 'set_config(variable=seed, value=999)']\n", "['2020-07-29 09', '51', '51,497', 'INFO', 'Global variable', 'seed updated']\n", "['2020-07-29 09', '51', '51,497', 'INFO', 'set_config() succesfully completed......................................']\n", "['2020-07-29 09', '51', '51,566', 'INFO', 'Initializing get_config()']\n", "['2020-07-29 09', '51', '51,567', 'INFO', 'get_config(variable=seed)']\n", "['2020-07-29 09', '51', '51,567', 'INFO', 'Global variable', 'seed returned']\n", "['2020-07-29 09', '51', '51,567', 'INFO', 'get_config() succesfully completed......................................']\n" ] } ], "source": [ "get_system_logs()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 11. MLFlow UI" ] }, { "cell_type": "code", "execution_count": 26, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "Running the mlflow server failed. Please see the logs above for details.\n" ] } ], "source": [ "!mlflow ui" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# End\n", "Thank you. 
For more information / tutorials on PyCaret, please visit https://www.pycaret.org" ] } ], "metadata": { "kernelspec": { "display_name": "pycaret-nightly-env", "language": "python", "name": "pycaret-nightly-env" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.10" } }, "nbformat": 4, "nbformat_minor": 2 }