{ "cells": [ { "cell_type": "code", "execution_count": 15, "metadata": { "scrolled": false }, "outputs": [], "source": [ "# If installed from pip, import lostruct as ls will work\n", "import lostruct.lostruct as ls\n", "\n", "# PCoA from skbio.stats is the best implementation of R's MDS algorithm\n", "from skbio.stats.ordination import pcoa\n", "\n", "# Much of the output from CyVCF2 and lostruct are numpy arrays\n", "import numpy as np\n", "\n", "import pandas as pd\n", "import plotly.express as px\n", "from sklearn.manifold import MDS\n", "import umap\n", "import hdbscan\n", "import plotly.io as pio\n", "pio.renderers.default = \"notebook_connected\"" ] }, { "cell_type": "code", "execution_count": 16, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "['HM017-I', 'HM018', 'HM022-I', 'HM029', 'HM030']" ] }, "execution_count": 16, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Two VCF utility functions are proivded. get_samples() and get_landmarks()\n", "\n", "# This will be the same order of the resulting data\n", "samples = ls.get_samples(\"test_data/chr1-filtered.vcf.gz\")\n", "samples[0:5]" ] }, { "cell_type": "code", "execution_count": 17, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "['chl_Mt', 'chr1', 'chr2', 'chr3', 'chr4']" ] }, "execution_count": 17, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Utility function: Get list of landmarks (chromosome, scaffolds, contigs, etc..)\n", "landmarks = ls.get_landmarks(\"test_data/chr1-filtered.vcf.gz\")\n", "landmarks[0:5]" ] }, { "cell_type": "code", "execution_count": 18, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Help on function get_samples in module lostruct.lostruct:\n", "\n", "get_samples(vcf_file)\n", " Get the samples from a VCF/BCF file. This is the order the data will remain in as well.\n", "\n" ] } ], "source": [ "# Docstrings are also provided\n", "help(ls.get_samples)" ] }, { "cell_type": "code", "execution_count": 19, "metadata": { "scrolled": false }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/home/josephguhlin/anaconda3/envs/lostruct/lib/python3.8/site-packages/numpy/core/_asarray.py:136: VisibleDeprecationWarning:\n", "\n", "Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. If you meant to do this, you must specify 'dtype=object' when creating the ndarray\n", "\n" ] } ], "source": [ "# Parse VCF to get windows and positions of each SNP within each window\n", "windows, positions = ls.parse_vcf(\"test_data/chr1-filtered.vcf.gz\", \"chr1\", 95, ls.Window.SNP)\n", "# ls.Window.SNP specifies window sizes are by SNP count. ls.Window.BP specifies windows are in base pair lengths.\n", "\n", "# *** ls.Window.BP is not yet implemented, however. ***\n", "# Please see: https://github.com/jguhlin/lostruct-py/issues/8\n", "\n", "# Accumulate output of eigen_windows\n", "result = list()\n", "for x in windows:\n", " result.append(ls.eigen_windows(x, 10, 1))\n", "\n", "# Convert to numpy array\n", "result = np.vstack(result)\n", "\n", "# Get PCA distances comparison matrix\n", "pc_dists = ls.get_pc_dists(result)\n", "# An additional mode, fastmath, is available. 
Trading some accuracy for a slight speed boost (~8%)\n", "pc_dists = ls.get_pc_dists(result, fastmath=True)\n", "\n", "# Get PCoA value of pc_dists matrix (this is equivalent to R's MDS)\n", "# PLEASE NOTE: See section below: Working with Large Datasets\n", "# For recommended ways to run pcoa\n", "mds = pcoa(pc_dists)\n" ] }, { "cell_type": "code", "execution_count": 20, "metadata": { "scrolled": false }, "outputs": [ { "data": { "text/html": [ " \n", " " ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "text/html": [ "
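{ "cell_type": "markdown", "metadata": {}, "source": [ "Quick sanity check (an added sketch, not part of the original walkthrough): `result` stacks one row per window, and `get_pc_dists` returns a symmetric window-by-window distance matrix, which is what `pcoa` was run on above." ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# Added sketch: one row per window, and a square window-by-window distance matrix\n", "print(len(windows), result.shape, pc_dists.shape)\n", "assert pc_dists.shape == (len(windows), len(windows))" ] },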
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "px.scatter(y=mds.samples[\"PC1\"], title=\"MDS Coordinate 1 (y-axis) compared to Window (x-axis)\")" ] }, { "cell_type": "code", "execution_count": 21, "metadata": { "scrolled": false }, "outputs": [ { "data": { "text/html": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "px.scatter(y=mds.samples[\"PC2\"], title=\"MDS Coordinate 2 (y-axis) compared to Window (x-axis)\")" ] }, { "cell_type": "code", "execution_count": 22, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "px.scatter(x=mds.samples[\"PC1\"], y=mds.samples[\"PC2\"], title=\"MDS Coordinate 1 (x-axis) and MDS Coordinate 2 (y-axis)\")" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Performing Analaysis Genome-Wide" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "landmarks = ls.get_landmarks(\"test_data/complete_file.vcf.gz\")\n", "\n", "results = list()\n", "snp_positions = list()\n", "\n", "for landmark in landmarks:\n", " windows, positions = ls.parse_vcf(\"test_data/complete_file.vcf.gz\", landmark, 95)\n", " for i, window in enumerate(windows):\n", " results.append(ls.eigen_windows(window, 10, 1))\n", " snp_positions.append(positions[i])" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "While the above will not work due to a missing file, it is the appropriate way to get the results for each window for all landmarks (chromosomes, scaffolds, contigs, etc...). Here, we keep track of snp_positions as well, and len(snp_positions) == len(results) so they can be further investigated.\n", "\n", "The code will then remain the same:" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# Convert to numpy array\n", "results = np.vstack(results)\n", "\n", "# Get PCA distances comparison matrix\n", "pc_dists = ls.get_pc_dists(results)\n", "\n", "# Get PCoA value of pc_dists matrix (this is equivalent to R's MDS)\n", "mds = pcoa(pc_dists)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Comparison to R Version" ] }, { "cell_type": "code", "execution_count": 23, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "0.9971509982243155" ] }, "execution_count": 23, "metadata": {}, "output_type": "execute_result" } ], "source": [ "mds_coords = pd.read_csv(\"lostruct-results/mds_coords.csv\")\n", "np.corrcoef(mds.samples['PC1'], mds_coords['MDS1'].to_numpy())[0][1]\n", "# R-value is:" ] }, { "cell_type": "code", "execution_count": 24, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "px.scatter(x=mds.samples[\"PC1\"], y=mds_coords['MDS1'])" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Working with Large Datasets" ] }, { "cell_type": "code", "execution_count": 25, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "-0.9972686515756828" ] }, "execution_count": 25, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# PCOA for reduced memory consumption and faster clustering\n", "mds = pcoa(pc_dists, method=\"fsvd\", inplace=True, number_of_dimensions=10)\n", "np.corrcoef(mds.samples[\"PC1\"], mds_coords['MDS1'].to_numpy())[0][1]" ] }, { "cell_type": "code", "execution_count": 26, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "px.scatter(y=[mds.samples[\"PC1\"], mds_coords['MDS1']], title=\"\")" ] }, { "cell_type": "code", "execution_count": 27, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "px.scatter(x=mds.samples[\"PC1\"], y=mds_coords['MDS1'])" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Some looks at other methods of clustering / comparing" ] }, { "cell_type": "code", "execution_count": 28, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "embedding = MDS(n_components=10, dissimilarity=\"precomputed\", n_jobs=-1, n_init=32)\n", "mds = embedding.fit_transform(pc_dists)\n", "px.scatter(y=[mds[:,0], mds_coords['MDS1']], title=\"Blue is using Python MDS, Red is PCoA method\")" ] }, { "cell_type": "code", "execution_count": 29, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Calculating PHATE...\n", " Running PHATE on precomputed distance matrix with 124 observations.\n", " Calculating graph and diffusion operator...\n", " Calculating affinities...\n", " Calculated affinities in 0.03 seconds.\n", " Calculated graph and diffusion operator in 0.03 seconds.\n", " Calculating optimal t...\n", " Automatically selected t = 12\n", " Calculated optimal t in 0.08 seconds.\n", " Calculating diffusion potential...\n", " Calculated diffusion potential in 0.15 seconds.\n", " Calculating metric MDS...\n", " Calculated metric MDS in 3.48 seconds.\n", "Calculated PHATE in 3.77 seconds.\n" ] } ], "source": [ "import phate\n", "phater = phate.PHATE(n_components=10, knn_dist='precomputed', mds_solver='smacof', mds='metric')\n", "comparison_phate = phater.fit_transform(pc_dists)" ] }, { "cell_type": "code", "execution_count": 30, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "mds = pcoa(pc_dists)\n", "px.scatter(y=[mds_coords['MDS1'], mds.samples[\"PC1\"], comparison_phate[:,0]], title=\"Green is PHATE\")\n", "# https://github.com/KrishnaswamyLab/PHATE\n", "# Moon, van Dijk, Wang, Gigante et al. Visualizing Transitions and Structure for Biological Data Exploration. 2019. Nature Biotechnology." ] }, { "cell_type": "code", "execution_count": 31, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "reducer = umap.UMAP()\n", "embedding = reducer.fit_transform(pc_dists)\n", "px.scatter(x=embedding[:, 0], y=embedding[:, 1])\n", "# UMAP: https://umap-learn.readthedocs.io/en/latest/index.html\n", "# McInnes, L, Healy, J, UMAP: Uniform Manifold Approximation and Projection for Dimension Reduction, ArXiv e-prints 1802.03426, 2018" ] }, { "cell_type": "code", "execution_count": 32, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "hdbscan_labels = hdbscan.HDBSCAN().fit_predict(embedding)\n", "px.scatter(x=embedding[:, 0], y=embedding[:, 1], color=hdbscan_labels)\n", "# hdbscan: https://hdbscan.readthedocs.io/en/latest/index.html" ] }, { "cell_type": "code", "execution_count": 33, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "reducer = umap.UMAP(n_components=3)\n", "embedding = reducer.fit_transform(pc_dists)\n", "hdbscan_labels = hdbscan.HDBSCAN().fit_predict(embedding)\n", "fig = px.scatter_3d(x=embedding[:, 0], y=embedding[:, 1], z=embedding[:, 2], color=hdbscan_labels, width=800, height=600)\n", "fig.show()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# The following is for future features, please disregard\n", "\n", "### Code used to generate the original random weights\n", "**If weights are urgently needed, please add a comment to the existing github issue**" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# Code originally used to generate and save random weights. Saved and static now to feed into R and compare with lostruct R\n", "weights = np.random.random_sample(len(samples))\n", "weights = weights*10\n", "\n", "outfh = open(\"test_data/random_weights.txt\", \"w\")\n", "\n", "outfh.write(\"{}\\t{}\\n\".format(\"ID\", \"weight\"))\n", "for id,w in zip(samples, weights):\n", " outfh.write(\"{}\\t{:.06f}\\n\".format(id, w))\n", "\n", "del(outfh)\n", "np.save(\"test_data/random_weights.npy\", weights)\n", "weights" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "weights = np.load(\"test_data/random_weights.npy\")\n", "weights" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "def get_pc_dists(windows, fastmath=False, w=1):\n", " \"\"\"\n", " Calculate distances between window matrices.\n", "\n", " Works on only the upper triangle of the matrix, but clones the data into the lower half as well.\n", " \"\"\"\n", " n = len(windows)\n", "\n", " vals = ls.l1_norm(np.asarray([x[2] for x in windows]))\n", " vals = vals.real.astype(np.float64)\n", " \n", " vecs = np.asarray([x[3] for x in windows])\n", " weights = w[:, np.newaxis]\n", " #sqrt_w = np.squeeze(np.repeat(np.sqrt(weights), result[0][3].shape[0], axis=1))\n", " sqrt_w = np.squeeze(np.sqrt(weights))\n", " print(sqrt_w.shape)\n", " vecs = np.multiply(vecs, sqrt_w)\n", " #vecs = np.multiply(vecs, sqrt_w.T)\n", " #print(vecs)\n", "\n", " if fastmath:\n", " comparison = ls.calc_dists_fastmath(n, vals, vecs)\n", " else:\n", " comparison = ls.calc_dists(n, vals, vecs)\n", "\n", " # Remove negatives... 
Can't be placed within Numba code\n", " comparison[comparison < 0] = 0\n", "\n", " # Get square root\n", " return np.sqrt(comparison)" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "vecs.shape" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "#result = list()\n", "#for x in windows:\n", "#    result.append(ls.eigen_windows(x, 10, weights))\n", "#result = np.vstack(result)\n", "\n", "pc_dists = get_pc_dists(result, fastmath=True, w=weights)\n", "mds = pcoa(pc_dists)\n", "mds_coords = pd.read_csv(\"lostruct-results/weights_mds_coords.csv\")\n", "print(\"Weights compared to Lostruct R:\")\n", "print(np.corrcoef(mds.samples['PC1'], mds_coords['MDS1'].to_numpy()))" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "pc_dists" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# Experimental alternative draft of get_pc_dists that applies the sample weights to the eigenvalues (x[2]) rather than the eigenvectors (compare with the version above)\n", "def get_pc_dists(windows, fastmath=False, w=1):\n", "    \"\"\"\n", "    Calculate distances between window matrices.\n", "\n", "    Works on only the upper triangle of the matrix, but clones the data into the lower half as well.\n", "    \"\"\"\n", "    n = len(windows)\n", "\n", "    sqrt_w = np.sqrt(w)\n", "    vals = ls.l1_norm(np.asarray([np.multiply(x[2], sqrt_w.T) for x in windows]))\n", "    vals = vals.real.astype(np.float64)\n", "\n", "    if fastmath:\n", "        comparison = ls.calc_dists_fastmath(n, vals, np.asarray([x[3] for x in windows]))\n", "    else:\n", "        comparison = ls.calc_dists(n, vals, np.asarray([x[3] for x in windows]))\n", "\n", "    # Remove negatives... Can't be placed within Numba code\n", "    comparison[comparison < 0] = 0\n", "\n", "    # Get square root\n", "    return np.sqrt(comparison)\n" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.8.5" } }, "nbformat": 4, "nbformat_minor": 4 }