# Plot clusters

In [None]:
# IPython magics: render matplotlib figures inline in the notebook output
%matplotlib inline
# Load the autoreload extension and reload modules whenever they change
%load_ext autoreload
%autoreload 2

# Make clusterking package available even without installation.
# The membership check keeps the cell idempotent: re-running it does not
# prepend another duplicate entry, and sys.path is modified in place instead
# of being rebound to a new list.
import sys
if "../../" not in sys.path:
    sys.path.insert(0, "../../")

In [None]:
import pandas as pd
import os.path
import matplotlib.pyplot as plt
from mpl_toolkits.mplot3d import Axes3D
from pathlib import Path

from clusterking.plots import ClusterPlot
from clusterking.data.data import Data

In [None]:
# Load the Data object from the SQL file output/tutorial_basics.sql
# (presumably written by the basics tutorial -- TODO confirm).
d = Data("output/tutorial_basics.sql")

## Manual Plotting

In [None]:
# Data frame behind the Data object and the distinct cluster labels in it
df = d.df
clusters = df["cluster"].unique()

# Colors and marker shapes are cycled through by cluster label when plotting
colors = ["red", "green", "blue", "pink"]
markers = ["o", "v", "^"]

### Manual 3d Plot

In [None]:
# Figure.gca(projection=...) was deprecated in Matplotlib 3.4 and is rejected
# by newer releases; add_subplot is the supported way to create 3D axes.
ax = plt.figure().add_subplot(projection='3d')
ax.set_xlabel('CVL_bctaunutau')
# The y axis shows the CSL_bctaunutau column (see the scatter call below)
ax.set_ylabel('CSL_bctaunutau')
ax.set_zlabel('CT_bctaunutau')

# One scatter series per cluster; color and marker cycle with the cluster label
for cluster in clusters:
    df_cluster = df[df['cluster'] == cluster]
    ax.scatter(
        df_cluster['CVL_bctaunutau'],
        df_cluster['CSL_bctaunutau'],
        df_cluster['CT_bctaunutau'],
        color=colors[cluster % len(colors)],
        marker=markers[cluster % len(markers)],
        label=cluster
    )

ax.legend(loc='upper left')
plt.show()

### Manual 2d Plot

In [None]:
fig, ax = plt.subplots()
ax.set_xlabel('CVL_bctaunutau')
ax.set_ylabel('CSL_bctaunutau')

# Fix the remaining Wilson coefficient: only points whose CT_bctaunutau equals
# the chosen unique value are drawn in the CVL/CSL plane.
t_value_index = 1
t_value = df['CT_bctaunutau'].unique()[t_value_index]
on_slice = df['CT_bctaunutau'] == t_value

# One scatter series per cluster; color and marker cycle with the cluster label
for cluster in clusters:
    df_cluster = df[(df['cluster'] == cluster) & on_slice]
    color = colors[cluster % len(colors)]
    marker = markers[cluster % len(markers)]
    ax.scatter(
        df_cluster['CVL_bctaunutau'],
        df_cluster['CSL_bctaunutau'],
        color=color,
        marker=marker,
        label=cluster,
    )

# Anchor the legend outside the axes, to the right of the plot
ax.legend(bbox_to_anchor=(1.2, 1.0))
plt.show()

## Using ``ClusterPlot``

<div class="alert alert-danger">
The interface via the class <code>ClusterPlot</code> might change or disappear in the future.
</div>

Set up the plotter:

In [None]:
# Build the plotter from the Data object loaded earlier in this notebook
cp = ClusterPlot(d)

In [None]:
# Turn on the plotter's draw_legend option
cp.draw_legend = True

### 3D plots

Scatter plot: The list is the list of the columns on the axes. 
Changing the order of the columns will turn around the cube. 

In [None]:
# 3D scatter plot: one axis per listed column, in the given order
cp.scatter(['CVL_bctaunutau', 'CSL_bctaunutau', 'CT_bctaunutau'])

If it is still hard to get an overview, use the ``clusters`` argument to restrict the plot to certain clusters.

In [None]:
# Same 3D scatter plot, restricted to clusters 0 and 2
cp.scatter(['CVL_bctaunutau', 'CSL_bctaunutau', 'CT_bctaunutau'], clusters=[0, 2])

If only two columns are given, several cuts will be presented (up to 16 by default):

### 2D cuts

In [None]:
# Only two columns are given, so the result is shown as a series of 2D cuts
cp.scatter(['CVL_bctaunutau', 'CSL_bctaunutau'])

Again, we can also limit ourselves to the clusters that we want to display:

In [None]:
# 2D cuts again, this time showing only clusters 1 and 2
cp.scatter(
    ['CVL_bctaunutau', 'CSL_bctaunutau'],
    clusters=[1, 2],
)

If many Wilson points are available, it is better to switch to a 'fill' plot:

In [None]:
# 'fill' plot over the same two columns as the 2D scatter cuts
cp.fill(['CVL_bctaunutau', 'CSL_bctaunutau'])

### More configuration

Several options to configure the ClusterPlot object can be changed after the object has been initialized.

The maximum number of subplots used for the 'slices' is given by the ``max_subplots`` attribute:

In [None]:
# Display the current value of max_subplots
cp.max_subplots

Let's change that (note that no warning is issued when trying to set a non-existing property, so do be careful with your typing):

In [None]:
# Set max_subplots to 3 for the plots that follow
cp.max_subplots = 3

And try it out:

In [None]:
# Same 2D scatter call as before, now with max_subplots set to 3
cp.scatter(['CVL_bctaunutau', 'CSL_bctaunutau'])

In [None]:
# Same 'fill' call as before, now with max_subplots set to 3
cp.fill(['CVL_bctaunutau', 'CSL_bctaunutau'])

To see all options, see the ``Attribute`` section of the help.

In [None]:
# Show the built-in help for the plotter object
help(cp)