{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "\"\"\"\n",
    "Execute the following cells to run the experiments\n",
    "\n",
    "Note:\n",
    "- The experiments are computationally expensive. Therefore, it is recommended to run them on a machine with multiple cores.\n",
    "- To change the distribution of the inlier clusters from Gaussian to t-distribution, set the parameter dist='t' in 'run_mixture_learning_experiment'.\n",
    "\n",
    "\"\"\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import rml_experiments\n",
    "import eval_performance as eval_perf\n",
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Gaussian Experiment"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_gauss = rml_experiments.run_mixture_learning_experiment(num_runs=1, multiprocessing_adv = True, gauss_multifilter=True, iterations_per_seed=8)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Adversarial Clusters Line Experiment"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_adv_line = rml_experiments.run_mixture_learning_experiment(num_runs=1, noise_model='adv', multiprocessing_adv = True, gauss_multifilter=True, iterations_per_seed=100)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Adversarial Clusters Circle Experiment"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_adv_circle = rml_experiments.run_mixture_learning_experiment(num_runs=1, noise_model='adv_circle', multiprocessing_adv=True, r=10, gauss_multifilter=True, iterations_per_seed=100)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Experiment Plots"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "seed = 0\n",
    "excluded_methods = ['Inner Stage']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "### Generate scatter plots\n",
    "eval_perf.plot_experiment_datapoints(df_gauss, excluded_methods=excluded_methods, seed=seed)\n",
    "eval_perf.plot_experiment_datapoints(df_adv_circle, noise_model='adv_circle', excluded_methods=excluded_methods, seed=seed)\n",
    "eval_perf.plot_experiment_datapoints(df_adv_line, noise_model='adv', excluded_methods=excluded_methods, seed=seed)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "### Generate bar plots\n",
    "output = eval_perf.plot_all_noise_models_quantile_average(constraint='list', df_adv_line=df_adv_line, df_gauss=df_gauss, df_adv_circle=df_adv_circle, max_val=80, excluded_methods=excluded_methods, percentile_constraint=80, seed=seed, log_scale=False)\n",
    "output = eval_perf.plot_all_noise_models_quantile_average(constraint='err', df_adv_line=df_adv_line, df_gauss=df_gauss, df_adv_circle=df_adv_circle, max_val=30, excluded_methods=excluded_methods, percentile_constraint=30, percentile_points=75, seed=seed, log_scale=False)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "base",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
