import marimo

__generated_with = "0.23.8"
app = marimo.App()


@app.cell
def _():
    import marimo as mo

    return (mo,)


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    # 4. Running a full analysis

    In this tutorial we'll perform a real analysis on part of the open dataset from ["A Data-Driven Characterisation Of Natural Facial Expressions When Giving Good And Bad News"](https://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1008335) by Watson & Johnston 2020.

    In the original paper the authors had 3 speakers deliver *good* or *bad* news while filming their facial expressions. They found that they could accurately "decode" each condition based on participants' facial expressions extracted either using a custom multi-channel-gradient model or action units (AUs) extracted using [OpenFace](https://github.com/TadasBaltrusaitis/OpenFace).

    In this tutorial we'll show how easy it is to not only reproduce their decoding analysis with py-feat, but just as easily perform additional analyses. Specifically we'll:

    1. Download 20 of the first subject's videos (the full dataset is available on [OSF](https://osf.io/6tbwj/))
    2. Extract facial features using the `Detectorv2`
    3. Aggregate and summarize detections per video using `Fex`
    4. Train and test a decoder to classify *good* vs *bad* news using extracted emotions, AUs, and poses
    5. Run an fMRI-style "mass-univariate" comparison across all AUs between conditions
    6. Run a time-series analysis comparing videos based on the time-courses of extracted facial features
    """)
    return


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    ## 4.1 The data

    We'll analyze 20 short clips from the [Watson & Johnston (2020)](https://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1008335) "good news vs bad news" dataset — 10 of each. To keep this tutorial fast and offline, the per-frame `Detectorv2` outputs are **pre-computed and bundled with the docs** under `docs/data/news_sample/`, so we load them directly instead of downloading videos and re-running detection. The full dataset is on [OSF](https://osf.io/6tbwj/).
    """)
    return


@app.cell
def _():
    from glob import glob
    from pathlib import Path

    import matplotlib.pyplot as plt
    import numpy as np
    import pandas as pd
    import seaborn as sns

    sns.set_context("talk")

    # The bundled per-frame Detectorv2 outputs (20 AUs + 7 emotions + valence/
    # arousal + head pose + gaze + the 478-vertex mesh landmarks + 52
    # blendshapes) live in docs/data/news_sample/. They were generated with
    # skip_frames=2 and committed so this tutorial runs offline.
    data_dir = Path(__file__).resolve().parents[1] / "data" / "news_sample"

    # Every per-clip CSV is named "<zero-padded clip number>.csv"; the "0*"
    # pattern keeps clip_attrs.csv out of the list. Each CSV stem is mapped
    # back to the name of the video it was computed from.
    _csv_paths = sorted(glob(str(data_dir / "0*.csv")))
    videos = [f"{Path(_p).stem}.mp4" for _p in _csv_paths]

    # Clip metadata: derive the video filename from the clip number, give the
    # class codes readable condition names, and keep only the bundled clips.
    _class_to_condition = {"gn": "goodNews", "ists": "badNews"}
    clip_attrs = (
        pd.read_csv(data_dir / "clip_attrs.csv")
        .assign(
            input=lambda d: d["clipN"].map(lambda n: f"{str(n).zfill(3)}.mp4"),
            condition=lambda d: d["class"].replace(_class_to_condition),
        )
        .query("input in @videos")
    )

    _n_good = (clip_attrs["condition"] == "goodNews").sum()
    _n_bad = (clip_attrs["condition"] == "badNews").sum()
    print(f"{len(videos)} clips: {_n_good} good news, {_n_bad} bad news")
    return clip_attrs, data_dir, np, pd, plt, sns, videos


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    ## 4.2 How the detections were generated

    The bundled CSVs were produced by running the `Detectorv2` over each clip and saving its per-frame output. You don't need to run this — we load the saved CSVs in the next section — but here's the code that made them:

    ```python
    from feat import Detectorv2

    detector = Detectorv2(device="cuda")  # or "mps" / "cpu"
    for video in videos:
        fex = detector.detect(video, data_type="video", batch_size=8, skip_frames=2)
        fex.to_csv(video.replace(".mp4", ".csv"), index=False)
    ```

    `read_feat` recognizes these as `Detectorv2` output (from their valence/arousal
    and 478-vertex mesh columns) and restores the matching `.aus` / `.emotions` /
    `.poses` / `.gazes` accessors.
    """)
    return


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    ## 4.3. Aggregate detections using a `Fex` dataframe
    """)
    return


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    Then we can use `read_feat` to load each CSV file and concatenate them together:
    """)
    return


@app.cell
def _(data_dir, pd, videos):
    from feat.utils.io import read_feat

    # Read one Fex per clip from the CSV that shares the video's name, then
    # stack them row-wise into a single Fex covering every frame.
    _per_clip = [
        read_feat(str(data_dir / _name.replace(".mp4", ".csv"))) for _name in videos
    ]
    fex_1 = pd.concat(_per_clip)

    # Quick sanity summary of what was loaded.
    _frames_per_video = fex_1.groupby("input").size()
    print(f"Unique videos: {fex_1.inputs.nunique()}")
    print(f"Total processed frames: {fex_1.shape[0]}")
    print(f"Avg frames per video: {_frames_per_video.mean()}")
    return (fex_1,)


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    Our `Fex` dataframe now contains all detections for all frames of each video
    """)
    return


@app.cell
def _(fex_1):
    # Only the final expression of a cell is rendered as its output, so the
    # shape is printed explicitly instead of being left as a bare expression
    # whose value would be silently discarded.
    print(f"Fex shape (frames, columns): {fex_1.shape}")

    # Preview the first few per-frame detections.
    fex_1.head()
    return


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    ### Summarize data with `Fex.sessions`

    `Fex` dataframes have a special attribute called `.sessions` that acts as a grouping factor to make it easier to compute summary statistics with any of the `.extract_*` methods. By default `.sessions` is `None`, but you can use `.update_sessions()` to return **a new Fex dataframe** with `.sessions` set.

    For example, if we update the sessions to be the name of each video, then `.extract_mean()` will group video-frames (rows) by video making it easy to compute a single summary statistic per file:
    """)
    return


@app.cell
def _(fex_1):
    # Use each frame's source video as its session label, so that summary
    # statistics are grouped per video.
    by_video = fex_1.update_sessions(fex_1["input"])

    # Compute the mean per video: 20 rows for 20 videos.
    video_means = by_video.extract_mean()
    video_means
    return by_video, video_means


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    Then we can grab the AU detections and call standard pandas methods like `.loc` and `.plot`:
    """)
    return


@app.cell
def _(sns, video_means):
    # Grab the per-video AU means for video 1 only.
    video001_aus = video_means.aus.loc["001.mp4"]

    # Plot them as one bar per AU.
    _ax = video001_aus.plot(kind="bar", title="Video 001 AU detection")
    _ax.set_ylabel("Average Probability")
    sns.despine()
    _ax.figure
    return


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    ### Chaining operations
    """)
    return


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    `.update_sessions()` always returns a **copy** of the Fex object, so that you can **chain** operations together including existing pandas methods like `.plot()`. Here's an example passing a dictionary to `.update_sessions()`, which maps between old and new session names:
    """)
    return


@app.cell
def _(by_video, clip_attrs, plt, sns):
    # Which condition each video belonged to
    video2condition = dict(zip(clip_attrs['input'], clip_attrs['condition']))

    # Update sessions to group by condition, compute means (per condition), and
    # make a barplot of the mean AUs for each condition.
    _condition_means = by_video.update_sessions(video2condition).extract_mean()
    _ax = _condition_means.aus.plot(kind='bar', legend=False)

    # Derive the display labels from the ticks that were actually plotted rather
    # than hard-coding their order: a fixed ['Good News', 'Bad News'] list
    # mislabels the bars whenever the grouped rows come back in a different
    # order (e.g. sorted, which puts 'badNews' first).
    _display_names = {'goodNews': 'Good News', 'badNews': 'Bad News'}
    _tick_labels = [
        _display_names.get(_tick.get_text(), _tick.get_text())
        for _tick in _ax.get_xticklabels()
    ]
    _ax.set(ylabel='Average Probability', title='AU detection by condition', xticklabels=_tick_labels)
    plt.xticks(rotation=0)
    sns.despine()
    _ax.figure
    return (video2condition,)


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    We can also focus in on the AUs associated with happiness:
    """)
    return


@app.cell
def _(by_video, np, plt, sns, video2condition):
    # AUs of interest (from https://py-feat.org/pages/au_reference.html) and
    # the summary columns that hold their per-session mean and SEM.
    aus = ['AU06', 'AU12', 'AU25']
    _mean_cols = [f'mean_{_au}' for _au in aus]
    _sem_cols = [f'sem_{_au}' for _au in aus]

    # Update the sessions to condition and compute summary stats (mean and
    # standard error only).
    summary = by_video.update_sessions(video2condition).extract_summary(
        mean=True, sem=True, std=False, min=False, max=False
    )

    # Grouped bars: one pair per AU, bad news to the left of good news.
    fig, _ax = plt.subplots(figsize=(3, 4))
    ind = np.arange(len(aus))
    width = 0.35
    _groups = (
        (-width / 2, 'badNews', 'Bad News'),
        (width / 2, 'goodNews', 'Good News'),
    )
    for _shift, _session, _label in _groups:
        _ax.bar(
            ind + _shift,
            summary.loc[_session, _mean_cols],
            width,
            yerr=summary.loc[_session, _sem_cols],
            label=_label,
        )

    _ax.set(ylabel='Average Probability', title='', xticks=ind, xticklabels=aus, ylim=(0, 1))
    _ax.legend(loc='upper left', frameon=False, bbox_to_anchor=(0, 1.25))
    # Dashed reference line at a probability of 0.5.
    _ax.axhline(0.5, ls='--', color='k')
    sns.despine()
    plt.xticks(rotation=45)
    plt.tight_layout()
    fig
    return


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    ## 4.4 Comparing the condition difference across AUs using regression

    One way we can test which AUs in the plot show significant differences is by using the `.regress()` method along with numerical contrast codes. For example we can test the difference in activation of every AU when participants delivered *good* vs *bad* news.

    This is analogous to the "mass-univariate" GLM approach in fMRI research, and allows us to identify what AUs are significantly more active in one condition vs another:
    """)
    return


@app.cell
def _(pd, sns, video2condition, video_means):
    # Save the by_condition fex: per-video means whose session is the video's
    # condition.
    by_condition = video_means.update_sessions(video2condition)

    # We set numerical contrasts to compare mean good news > mean bad news
    by_condition_codes = by_condition.update_sessions({'goodNews': 1.0, 'badNews': -1})

    # Now we perform a regression (t-test) at every AU
    b, se, t, p, df, residuals = by_condition_codes.regress(X='sessions', y='aus', fit_intercept=True)

    # Bonferroni correction for multiple comparisons: each p-value is
    # MULTIPLIED by the number of tests (one per AU column) and capped at 1.
    # Dividing instead would shrink the p-values and inflate significance.
    p_bonf = (p * p.shape[1]).clip(upper=1.0)

    def _contrast_row(stat, label):
        """Return the rounded 'sessions' (condition contrast) row of `stat`, renamed to `label`."""
        return stat.round(3).loc[['sessions']].rename(index={'sessions': label})

    _results = pd.concat([
        _contrast_row(b, 'betas'),
        _contrast_row(se, 'ses'),
        _contrast_row(t, 't-stats'),
        _contrast_row(df, 'dof'),
        _contrast_row(p_bonf, 'p-values'),
    ])

    # One bar per AU: beta +/- SE, coloured by corrected significance.
    _bar_colors = ['steelblue' if _significant else 'gray' for _significant in _results.loc['p-values'] < 0.01]
    _ax = _results.loc['betas'].plot(kind='bar', yerr=_results.loc['ses'], color=_bar_colors, title='Good News > Bad News\n(blue: p < .01)')

    # Keep only the part of each column name after the last underscore.
    xticks = _ax.get_xticklabels()
    xticks = [elem.get_text().split('_')[-1] for elem in xticks]
    _ax.set_xticklabels(xticks)
    _ax.set_ylabel('Beta +/- SE')
    sns.despine()
    _ax.figure
    return (by_condition,)


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    ## 4.5 Decoding condition from facial features

    We can easily perform an analysis just like Watson & Johnston, by training a LinearDiscriminantAnalysis (LDA) decoder to classify which condition a video came from based on average **AU** and **head pose** detections.

    To do this we can use the `.predict()` method, which behaves just like `.regress()` but also requires a `sklearn` `Estimator`. We can use keyword arguments to perform 10-fold cross-validation to test the accuracy of each decoder:
    """)
    return


@app.cell
def _(by_condition, pd, plt, sns):
    from sklearn.discriminant_analysis import LinearDiscriminantAnalysis
    from sklearn.pipeline import make_pipeline
    from sklearn.preprocessing import StandardScaler

    # List of different models we'll train, one per feature set.
    feature_list = ['emotions', 'aus', 'poses', 'emotions,poses', 'aus,poses']
    # Display names used on the plot's x-axis.
    _display_names = {
        'emotions': 'Emotions',
        'poses': 'Pose',
        'aus': 'AUs',
        'emotions,poses': 'Emotions\n+ Pose',
        'aus,poses': 'AUs+Pose',
    }

    models = {}
    _per_model = []
    for features in feature_list:
        # Always a good idea to normalize your features! Each decoder gets its
        # own scaler + LDA pipeline.
        _decoder = make_pipeline(StandardScaler(), LinearDiscriminantAnalysis())
        # .predict is just like .regress, but this time session is our y; the
        # decoder is scored with 10-fold cross-validation.
        model, accuracy = by_condition.predict(X=features, y='sessions', model=_decoder, cv_kwargs={'cv': 10})
        # Save the model
        models[features] = model
        _per_model.append(pd.DataFrame({'Accuracy': accuracy * 100, 'Features': [features] * len(accuracy)}))
        print(f'{features} model accuracy: {accuracy.mean() * 100:.3g}% +/- {accuracy.std() * 100:.3g}%')

    # Concat results into a single dataframe and tweak the feature names.
    _results = pd.concat(_per_model).assign(Features=lambda d: d['Features'].map(_display_names))

    # Plot it
    f, _ax = plt.subplots(1, 1, figsize=(3.75, 4))
    _ax = sns.barplot(
        x='Features',
        y='Accuracy',
        errorbar='sd',
        dodge=False,
        hue='Features',
        data=_results,
        ax=_ax,
        order=['Emotions', 'Emotions\n+ Pose', 'AUs+Pose', 'AUs', 'Pose'],
    )
    # hue duplicates the x-axis here, so drop the legend if one was drawn.
    _legend = _ax.get_legend()
    if _legend is not None:
        _legend.remove()
    _ax.set_title('Good News vs Bad News\nClassifier Performance')
    _ax.set(ylabel='Accuracy', xlabel='')
    sns.despine()
    # Dashed line at 50% accuracy.
    _ax.axhline(y=50, ls='--', color='k')
    plt.xticks(rotation=90)
    plt.tight_layout()
    f
    return (models,)


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    ### Visualizing decoder weights
    Using what we learned in the previous tutorial, we can visualize the coefficients for any models that used AU features. This allows us to "see" the underlying facial expression that the classifier learned!
    """)
    return


@app.cell
def _(models, np, plt):
    from feat.plotting import plot_face_mesh

    # Step 1 of the 'aus' pipeline is the LDA (step 0 is the StandardScaler);
    # its coefficients are signed weights over the AUs.
    _lda = models['aus'][1]
    _weights = _lda.coef_.squeeze()

    # Min-max scale the weights into a positive AU-intensity range of [0, 2].
    # The small epsilon avoids dividing by zero if all weights are equal.
    _span = np.ptp(_weights) + 1e-12
    _au = (_weights - _weights.min()) / _span * 2.0

    # Render the predicted 478-vertex mesh so we can "see" the
    # (good-news-leaning) expression the classifier learned — the Detectorv2
    # analog of the 68-pt plot_face.
    _fig, _ax = plt.subplots(figsize=(5, 5), subplot_kw={"projection": "3d"})
    plot_face_mesh(au=_au, ax=_ax, mode="tesselation")
    _ax.set_title("Expression reconstructed from\nAU classifier weights")
    _fig
    return


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    You can also *animate* this expression to emphasize what's changing — pass the
    same scaled AU-weight vector as `end` (and a neutral `np.zeros(20)` as `start`)
    to `animate_face_mesh_plotly` for an interactive 3D morph. See
    [tutorial 3](Plotting.md) for animation examples.
    """)
    return


@app.cell(hide_code=True)
def _(mo):
    mo.md(r"""
    ## 4.6 Time-series analysis

    Finally we might be interested in looking at the similarity of the detected features **over time**. We can do that using the `.isc()` method which takes a column and metric to use. Here we compare detected happiness between all pairs of videos.

    We use some helper functions to cluster, sort, and plot the correlation matrix. Warmer colors indicate a pair of videos elicited more *similar* detected Happiness over time. We see that some videos show high correlation in terms of their detected happiness over time. This is likely why the classifier above was able to decode conditions so well.
    """)
    return


@app.cell
def _(fex_1):
    # Correlate the 'Happy' time course between every pair of videos; ISC
    # returns a video x video pearson correlation matrix. Detectorv2 emotion
    # columns are capitalized, hence 'Happy' rather than 'happiness'.
    isc = fex_1.isc(
        col="Happy",
        method="pearson",
    )
    return (isc,)


@app.cell
def _(isc, np, plt, sns, video2condition):
    def cluster_corrs(df):
        """Reorder the rows and columns of a correlation matrix by hierarchical cluster.

        Rows are clustered with complete linkage on their pairwise distances,
        the tree is cut at half of the largest pairwise distance, and the same
        cluster-sorted ordering is applied to both axes.
        """
        import scipy.cluster.hierarchy as sch
        pairwise_distances = sch.distance.pdist(df)
        linkage = sch.linkage(pairwise_distances, method='complete')
        cluster_distance_threshold = pairwise_distances.max() / 2
        idx_to_cluster_array = sch.fcluster(linkage, cluster_distance_threshold, criterion='distance')
        # Sorting by cluster id places members of the same cluster side by side.
        idx = np.argsort(idx_to_cluster_array)
        return df.iloc[idx, :].T.iloc[idx, :]

    def add_cond_to_ticks(ax):
        """Rewrite the tick labels of `ax` as '<condition>_<clip id>' and return `ax`.

        Each existing tick label must be a key of `video2condition`
        (e.g. '001.mp4'); it becomes e.g. 'good_01'.
        """
        def _relabel(tick):
            name = tick.get_text()
            # Drop the trailing 'News' from 'goodNews' / 'badNews'.
            condition = video2condition[name][:-4]
            # Strip whatever file extension the label carries (.mp4 or .csv),
            # then drop the leading zero-padding digit.
            clip_id = name.rsplit('.', 1)[0][1:]
            return f"{condition}_{clip_id}"

        # Relabel each axis on its own, so nothing is dropped if the two axes
        # happen to show a different number of ticks.
        ax.set_xticklabels([_relabel(_tick) for _tick in ax.get_xticklabels()])
        ax.set_yticklabels([_relabel(_tick) for _tick in ax.get_yticklabels()])
        return ax

    # Plot it on a dedicated figure, so the heatmap cannot land on whatever
    # axes pyplot currently considers active from an earlier cell.
    _fig, _ax = plt.subplots()
    sns.heatmap(cluster_corrs(isc), cmap='RdBu_r', vmin=-1, vmax=1, square=True, ax=_ax)
    _ax = add_cond_to_ticks(_ax)
    _ax.set(xlabel='', ylabel='', title='Inter-video Happiness\ntimeseries correlation')
    _ax.figure
    return


if __name__ == "__main__":
    app.run()