{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "This notebook is based on the example [script](https://github.com/katkost/MazurkaBL/blob/master/scripts/ismir_tutorial.ipynb) in the MazurkaBL repository.\n",
    "\n",
    "**Run this from within the `scripts` folder of the MazurkaBL repository (git commit: 00c5b67cc5a1a0d9b7cce401729f2bca666aa6f5).**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "%matplotlib inline"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Import libraries"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import glob\n",
    "%matplotlib inline\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "sns.set()\n",
    "\n",
    "import pandas as bd\n",
    "import IPython.display as ipd\n",
    "from scipy.io import wavfile\n",
    "from IPython.display import Image\n",
    "from data_processing import prepare_dataset, get_names_from_mazurka, plot_beat_dyn, plot_dyn_with_markings_values_boxplots, plot_dyn_change_curves, prepare_dataset_change_points, get_clusters_and_print_outlier_cluster_names, plot_sones_with_cp, plot_total_cps, get_seconds_for_change_points, get_change_point_positions_in_sone_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Retrieving information from the .csv files...\n",
      "Done!\n"
     ]
    }
   ],
   "source": [
    "files_beat = glob.glob('../beat_time/*.csv')\n",
    "files_dyn = glob.glob('../beat_dyn/*.csv')\n",
    "files_mark = glob.glob('../markings/*.csv')\n",
    "files_mark_dyn = glob.glob('../markings_dyn/*.csv')\n",
    "Mazurka_info = prepare_dataset(files_beat, files_dyn, files_mark, files_mark_dyn)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Retrieve the change point data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Retrieving information from the change points data files...\n",
      "Done!\n"
     ]
    }
   ],
   "source": [
    "folder_sones = ('../sones/')\n",
    "files_cp_per_recording_in_mazurka = glob.glob('../change_points_data/cp_per_maz_rec_PELT/*.txt')\n",
    "files_total_cp = glob.glob('../change_points_data/cp_per_beat_tables_PELT/*.csv')\n",
    "\n",
    "Mazurka_info_cp = prepare_dataset_change_points(folder_sones, files_cp_per_recording_in_mazurka, files_total_cp, files_mark)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "pianist_general = Mazurka_info['M17-4'][1]\n",
    "pianist = Mazurka_info_cp['M17-4'][1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[np.int64(10),\n",
       " np.int64(171),\n",
       " np.int64(656),\n",
       " np.int64(1246),\n",
       " np.int64(1885),\n",
       " np.int64(2230),\n",
       " np.int64(3025),\n",
       " np.int64(4704),\n",
       " np.int64(5415),\n",
       " np.int64(6131),\n",
       " np.int64(6685),\n",
       " np.int64(8193),\n",
       " np.int64(9607),\n",
       " np.int64(9888),\n",
       " np.int64(10468),\n",
       " np.int64(10995),\n",
       " np.int64(11570),\n",
       " np.int64(12142),\n",
       " np.int64(12676),\n",
       " np.int64(12931),\n",
       " np.int64(13463),\n",
       " np.int64(15248),\n",
       " np.int64(15797),\n",
       " np.int64(16657),\n",
       " np.int64(18699),\n",
       " np.int64(19464),\n",
       " np.int64(19750)]"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "seconds_for_change_points = get_seconds_for_change_points(pianist_general.beat, pianist.cp)\n",
    "change_point_positions_in_sone_data = get_change_point_positions_in_sone_data(pianist.sones['time_frame_in_sec'], seconds_for_change_points)\n",
    "change_point_positions_in_sone_data # this is the ground truth that we consider"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "np.savetxt(\"sones.txt\", np.array(Mazurka_info_cp['M17-4'][1].sones[\"sone_value\"]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'pid50534-05'"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "pianist_general[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
