{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "992be3e3",
   "metadata": {},
   "outputs": [],
   "source": [
    "import glob\n",
    "import os\n",
    "import re\n",
    "import shutil\n",
    "\n",
    "import nibabel as nib\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import yaml\n",
    "from nilearn import surface\n",
    "from nilearn import plotting\n",
    "from nilearn.masking import unmask\n",
    "from tqdm.auto import tqdm"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "17709863",
   "metadata": {},
   "outputs": [],
   "source": [
    "with open('config.yaml', 'r') as f:\n",
    "    data = yaml.safe_load(f)\n",
    "\n",
    "print(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "389848af",
   "metadata": {},
   "outputs": [],
   "source": [
    "subject_id = 'CSI1'\n",
    "assert subject_id in data['THINGS-fMRI']\n",
    "paths = data['THINGS-fMRI'][subject_id]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5843f22f",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_processed_subject = os.path.join('..', 'processed', subject_id)\n",
    "os.makedirs(path_processed_subject, exist_ok=True)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "3f993c5e",
   "metadata": {},
   "source": [
    "## T1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5e6a3a10",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_T1_raw = paths['T1']\n",
    "assert os.path.exists(path_T1_raw)\n",
    "print(path_T1_raw)\n",
    "\n",
    "path_T1_processed = os.path.join(path_processed_subject, 'structural', f'{subject_id}_T1w.nii.gz')\n",
    "\n",
    "if not os.path.exists(path_T1_processed):\n",
    "    os.makedirs(os.path.dirname(path_T1_processed), exist_ok=True)\n",
    "    vol_T1 = nib.load(path_T1_raw)\n",
    "    nib.save(vol_T1, path_T1_processed)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "2692a6de",
   "metadata": {},
   "source": [
    "## T2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "2c6b7593",
   "metadata": {},
   "outputs": [],
   "source": [
    "if 'T2' in paths:\n",
    "    path_T2_raw = paths['T2']\n",
    "    assert os.path.exists(path_T2_raw)\n",
    "    print(path_T2_raw)\n",
    "\n",
    "    path_T2_processed = os.path.join(path_processed_subject, 'structural', f'{subject_id}_T2w.nii.gz')\n",
    "\n",
    "    if not os.path.exists(path_T2_processed):\n",
    "        os.makedirs(os.path.dirname(path_T2_processed), exist_ok=True)\n",
    "        vol_T2 = nib.load(path_T2_raw)\n",
    "        nib.save(vol_T2, path_T2_processed)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "3e9c62a4",
   "metadata": {},
   "source": [
    "## Brainmask"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b3eb944a",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_brainmask_raw = paths['brainmask']\n",
    "assert os.path.exists(path_brainmask_raw)\n",
    "print(path_brainmask_raw)\n",
    "\n",
    "path_brainmask_processed = os.path.join(path_processed_subject, 'brainmasks', f'{subject_id}_brainmask.nii.gz')\n",
    "\n",
    "if not os.path.exists(path_brainmask_processed):\n",
    "    os.makedirs(os.path.dirname(path_brainmask_processed), exist_ok=True)\n",
    "    shutil.copy2(path_brainmask_raw, path_brainmask_processed)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "0b20c7db",
   "metadata": {},
   "source": [
    "## Stimuli"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "2594ab72",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_stimuli_raw = paths['stimuli']\n",
    "print(path_stimuli_raw)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4be9ce47",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_session_stimuli = sorted(glob.glob(os.path.join(path_stimuli_raw, f'{subject_id}_sess**/')))\n",
    "for path_session in path_session_stimuli:\n",
    "    print(path_session)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0e1c5827",
   "metadata": {},
   "outputs": [],
   "source": [
    "for path_session in path_session_stimuli:\n",
    "    files = glob.glob(os.path.join(path_session, 'CSI_*.txt'))\n",
    "    for file_path in files:\n",
    "        folder_name = os.path.dirname(file_path)\n",
    "        filename = os.path.basename(file_path)\n",
    "        new_filename = filename.replace('CSI_', 'CSI1_', 1)  # only replace the first occurrence\n",
    "        new_path = os.path.join(folder_name, new_filename)\n",
    "        os.rename(file_path, new_path)\n",
    "        print(f'Renamed: {filename} → {new_filename}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c46a92c5",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_stimuli_processed = []\n",
    "\n",
    "i_trial = 0\n",
    "for i_session, path_session in enumerate(path_session_stimuli, 1):\n",
    "    assert os.path.exists(path_session)\n",
    "    session_name = os.path.basename(os.path.normpath(path_session))\n",
    "    path_runs = sorted(glob.glob(os.path.join(path_session, f'{session_name}_run*.txt')))\n",
    "    for i_run, path_run in enumerate(path_runs, 1):\n",
    "        data_run = np.loadtxt(path_run, dtype=str)\n",
    "        for stimuli in data_run:\n",
    "            df_stimuli_processed.append({'Session': i_session,\n",
    "                               'Run': i_run,\n",
    "                               'Trial': i_trial,\n",
    "                               'Split': 'test' if 'rep_' in stimuli else 'train',\n",
    "                               'Stimulus': stimuli.split('rep_')[-1]\n",
    "                               })\n",
    "            i_trial += 1\n",
    "\n",
    "df_stimuli_processed = pd.DataFrame(df_stimuli_processed)    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "589fa549",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_stimuli_processed['Split'].value_counts()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "a0582579",
   "metadata": {},
   "source": [
    "Gather the different names of the stimuli from the different datasets to classify them according to their type."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "04fa3e3a",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_stimuli_info = os.path.dirname(os.path.dirname(paths['stimuli']))\n",
    "path_stimuli_datasets = os.path.join(path_stimuli_info, 'Scene_Stimuli', 'Presented_Stimuli')\n",
    "assert os.path.exists(path_stimuli_datasets)\n",
    "\n",
    "path_stimuli_datasets = sorted(glob.glob(os.path.join(path_stimuli_datasets, '*')))\n",
    "\n",
    "dict_images_dataset = {}\n",
    "for path_stimuli_dataset in path_stimuli_datasets:\n",
    "    assert os.path.exists(path_stimuli_dataset)\n",
    "    dataset_name = os.path.basename(os.path.normpath(path_stimuli_dataset))\n",
    "    list_images_dataset = sorted(glob.glob(os.path.join(path_stimuli_dataset, '*')))\n",
    "    dict_images_dataset[dataset_name] = []\n",
    "    for image in list_images_dataset:\n",
    "        image_name = os.path.basename(image)\n",
    "        dict_images_dataset[dataset_name].append(image_name)\n",
    "    print(f'{dataset_name}: {len(dict_images_dataset[dataset_name])} images')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6144d011",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_labels_imagenet = os.path.join(path_stimuli_info, 'Image_Labels', 'imagenet_final_labels.txt')\n",
    "\n",
    "data_imagenet = []\n",
    "\n",
    "with open(path_labels_imagenet, 'r') as f:\n",
    "    for line in f:\n",
    "        parts = line.strip().split(' ', 1)\n",
    "        label = parts[0]\n",
    "        concept = parts[1].split(',')[0].strip()\n",
    "        data_imagenet.append({'Label': label, 'Concept': concept})\n",
    "\n",
    "df_labels_imagenet = pd.DataFrame(data_imagenet)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8d7dd3ce",
   "metadata": {},
   "outputs": [],
   "source": [
    "for image_label in df_stimuli_processed['Stimulus']:\n",
    "    is_coco = image_label in dict_images_dataset['COCO']\n",
    "    is_imagenet = image_label in dict_images_dataset['ImageNet']\n",
    "    is_scene = image_label in dict_images_dataset['Scene']\n",
    "    if is_coco:\n",
    "        df_stimuli_processed.loc[df_stimuli_processed['Stimulus'] == image_label, 'Dataset'] = 'COCO'\n",
    "        df_stimuli_processed.loc[df_stimuli_processed['Stimulus'] == image_label, 'Type'] = 'multiple'\n",
    "        df_stimuli_processed.loc[df_stimuli_processed['Stimulus'] == image_label, 'Concept'] = np.nan\n",
    "    elif is_imagenet:\n",
    "        df_stimuli_processed.loc[df_stimuli_processed['Stimulus'] == image_label, 'Dataset'] = 'ImageNet'\n",
    "        df_stimuli_processed.loc[df_stimuli_processed['Stimulus'] == image_label, 'Type'] = 'single'\n",
    "        df_stimuli_processed.loc[df_stimuli_processed['Stimulus'] == image_label, 'Concept'] = df_labels_imagenet[df_labels_imagenet['Label'] == image_label.split('_')[0]]['Concept'].item()\n",
    "    elif is_scene:\n",
    "        df_stimuli_processed.loc[df_stimuli_processed['Stimulus'] == image_label, 'Dataset'] = 'Scene'\n",
    "        df_stimuli_processed.loc[df_stimuli_processed['Stimulus'] == image_label, 'Type'] = 'scene'\n",
    "        df_stimuli_processed.loc[df_stimuli_processed['Stimulus'] == image_label, 'Concept'] = re.sub(r'\\d+', '', image_label.split('.')[0])\n",
    "    else:\n",
    "        raise NotImplementedError(f'Stimulus {image_label} not found in any dataset')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a4ed56c5",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_stimuli_processed['Subject'] = subject_id\n",
    "df_stimuli_processed"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6d923354",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_stimuli_processed = os.path.join(path_processed_subject, 'stimuli', f'{subject_id}_stimuli.csv')\n",
    "\n",
    "if not os.path.exists(path_stimuli_processed):\n",
    "    os.makedirs(os.path.dirname(path_stimuli_processed), exist_ok=True)\n",
    "    df_stimuli_processed.to_csv(path_stimuli_processed, index=False)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "33948546",
   "metadata": {},
   "source": [
    "## ROIS"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "0d421580",
   "metadata": {},
   "source": [
    "### Localizers"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "dcc0d46f",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_rois_raw = paths['rois']\n",
    "assert os.path.exists(path_rois_raw)\n",
    "print(path_rois_raw)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d913dc78",
   "metadata": {},
   "outputs": [],
   "source": [
    "vol_brainmask = nib.load(path_brainmask_processed)\n",
    "data_brainmask = vol_brainmask.get_fdata().astype(bool)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d5e9a48c",
   "metadata": {},
   "outputs": [],
   "source": [
    "paths_rois = sorted(glob.glob(os.path.join(path_rois_raw, f'sub-{subject_id}_*.nii.gz')))\n",
    "\n",
    "df_rois = pd.DataFrame({})\n",
    "\n",
    "for i_roi, path_roi in enumerate(paths_rois, 1):\n",
    "    name_roi = os.path.basename(path_roi).split('-')[-1].split('.')[0]\n",
    "\n",
    "    vol_roi = nib.load(path_roi)\n",
    "    data_roi = vol_roi.get_fdata() > 0\n",
    "\n",
    "    masked_roi = data_roi[data_brainmask]  # shape: (num_voxels,)\n",
    "    df_rois[name_roi] = masked_roi.astype(int)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d9b95f01",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_rois_processed = os.path.join(path_processed_subject, 'rois', f'{subject_id}_rois.csv')\n",
    "\n",
    "if not os.path.exists(path_rois_processed):\n",
    "    os.makedirs(os.path.dirname(path_rois_processed), exist_ok=True)\n",
    "    df_rois.to_csv(path_rois_processed, index=False)\n",
    "df_rois"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "f273625c",
   "metadata": {},
   "source": [
    "## Betas"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "18c28dc2",
   "metadata": {},
   "source": [
    "### Volume"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8590df88",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_betas_folder = os.path.join('..', 'dataset', '2.0', '14456124')\n",
    "assert os.path.exists(path_betas_folder)\n",
    "print(path_betas_folder)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "16b41407",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_betas_files = sorted(glob.glob(os.path.join(path_betas_folder, f'{subject_id}_GLMbetas-TYPED-FITHRF-GLMDENOISE-RR_ses-*.nii.gz')))\n",
    "assert len(path_betas_files) > 0"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a8724288",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_betas_vol = os.path.join(path_processed_subject, 'betas', 'vol', f'{subject_id}_betas_vol.npy')\n",
    "os.makedirs(os.path.dirname(path_betas_vol), exist_ok=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5cf7ed64",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_betas_files"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e99a0767",
   "metadata": {},
   "outputs": [],
   "source": [
    "from scipy.stats import zscore\n",
    "\n",
    "if not os.path.exists(path_betas_vol):\n",
    "    data_brainmask_flat = data_brainmask.flatten()\n",
    "    betas = []\n",
    "\n",
    "    for path_data in tqdm(path_betas_files, total=len(path_betas_files)):\n",
    "        assert os.path.exists(path_data)\n",
    "        vol_bold = nib.load(path_data)\n",
    "        data_bold = vol_bold.get_fdata()\n",
    "        data_bold_z = zscore(data_bold.reshape(-1, data_bold.shape[3]), axis=1, nan_policy='omit')\n",
    "        data_bold_z = np.nan_to_num(data_bold_z)\n",
    "        betas = data_bold_z.reshape(data_bold.shape)\n",
    "\n",
    "# betas = np.load(path_betas_vol)\n",
    "# print(betas.shape)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "40437cc6",
   "metadata": {},
   "source": [
    "### Surface"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "b0c8c8f6",
   "metadata": {},
   "source": [
    "### Left Hemisphere"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d7fb8e40",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_freesurfer = paths['freesurfer']\n",
    "\n",
    "path_mesh_pial_left = os.path.join(path_freesurfer, 'surf', 'lh.pial')\n",
    "path_mesh_white_left = os.path.join(path_freesurfer, 'surf', 'lh.white')\n",
    "\n",
    "assert os.path.exists(path_mesh_pial_left)\n",
    "assert os.path.exists(path_mesh_white_left)\n",
    "\n",
    "print(path_mesh_pial_left)\n",
    "print(path_mesh_white_left)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b674d338",
   "metadata": {},
   "outputs": [],
   "source": [
    "mesh_pial_left = surface.load_surf_mesh(path_mesh_pial_left)\n",
    "mesh_white_left = surface.load_surf_mesh(path_mesh_white_left)\n",
    "num_vertices_left = mesh_pial_left.n_vertices\n",
    "assert mesh_pial_left.n_vertices == mesh_white_left.n_vertices\n",
    "\n",
    "print('Num. Vertices Left:', num_vertices_left)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "be7fcb0b",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_betas_surf_left = os.path.join(path_processed_subject, 'betas', 'surf', f'{subject_id}_betas_surf_lh.npy')\n",
    "\n",
    "os.makedirs(os.path.dirname(path_betas_surf_left), exist_ok=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "34f71402",
   "metadata": {},
   "outputs": [],
   "source": [
    "num_stimuli = betas.shape[0]\n",
    "betas_surf_left = np.zeros((num_stimuli, num_vertices_left), dtype=np.float32)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "086ab25c",
   "metadata": {},
   "outputs": [],
   "source": [
    "vol_betas_stimulus.get_fdata()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6a3012c3",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0351a0a4",
   "metadata": {},
   "outputs": [],
   "source": [
    "if not os.path.exists(path_betas_surf_left):\n",
    "    for i_stimulus in tqdm(range(num_stimuli)):\n",
    "        betas_stimulus = betas[i_stimulus, :]\n",
    "        vol_betas_stimulus = unmask(betas_stimulus, vol_brainmask)\n",
    "        betas_surf_left[i_stimulus, :] = surface.vol_to_surf(vol_betas_stimulus,\n",
    "                                                             surf_mesh=mesh_pial_left,\n",
    "                                                             inner_mesh=mesh_white_left,\n",
    "                                                             interpolation='linear',\n",
    "                                                             kind='depth',\n",
    "                                                             depth=[0.5])\n",
    "    # np.save(path_betas_surf_left, betas_surf_left)\n",
    "\n",
    "betas_surf_left = np.load(path_betas_surf_left)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "69cf01d6",
   "metadata": {},
   "source": [
    "#### Right Hemisphere"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7d324db8",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_betas_surf_right = os.path.join(path_processed_subject, 'betas', 'surf', f'{subject_id}_betas_surf_rh.npy')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "61305d12",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_mesh_pial_right = os.path.join(path_freesurfer, 'surf', 'rh.pial')\n",
    "path_mesh_white_right = os.path.join(path_freesurfer, 'surf', 'rh.white')\n",
    "\n",
    "assert os.path.exists(path_mesh_pial_right)\n",
    "assert os.path.exists(path_mesh_white_right)\n",
    "\n",
    "print(path_mesh_pial_right)\n",
    "print(path_mesh_white_right)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "322d679c",
   "metadata": {},
   "outputs": [],
   "source": [
    "mesh_pial_right = surface.load_surf_mesh(path_mesh_pial_right)\n",
    "mesh_white_right = surface.load_surf_mesh(path_mesh_white_right)\n",
    "num_vertices_right = mesh_pial_right.n_vertices\n",
    "assert mesh_pial_right.n_vertices == mesh_white_right.n_vertices\n",
    "\n",
    "print('Num. Vertices Right:', num_vertices_right)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "43714fdf",
   "metadata": {},
   "outputs": [],
   "source": [
    "betas_surf_right = np.zeros((num_stimuli, num_vertices_right), dtype=np.float32)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "56912964",
   "metadata": {},
   "outputs": [],
   "source": [
    "\"\"\"\n",
    "if not os.path.exists(path_betas_surf_right):\n",
    "    for i_stimulus in tqdm(range(num_stimuli)):\n",
    "        betas_stimulus = betas[i_stimulus, :]\n",
    "        vol_betas_stimulus = unmask(betas_stimulus, vol_brainmask)\n",
    "        betas_surf_right[i_stimulus, :] = surface.vol_to_surf(vol_betas_stimulus,\n",
    "                                                              surf_mesh=mesh_pial_right,\n",
    "                                                              inner_mesh=mesh_white_right,\n",
    "                                                              interpolation='linear',\n",
    "                                                              kind='depth',\n",
    "                                                              depth=[0.5])\n",
    "    np.save(path_betas_surf_right, betas_surf_right)\n",
    "\"\"\""
   ]
  },
  {
   "cell_type": "markdown",
   "id": "0a43cdd2",
   "metadata": {},
   "source": [
    "## Visualize betas"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "74c89ea9",
   "metadata": {},
   "outputs": [],
   "source": [
    "path_inflated = os.path.join(path_freesurfer, 'surf', f'lh.inflated')\n",
    "assert os.path.exists(path_inflated)\n",
    "\n",
    "mesh_inflated = surface.load_surf_mesh(path_inflated)\n",
    "print(mesh_inflated.n_vertices)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "aa856a35",
   "metadata": {},
   "outputs": [],
   "source": [
    "idx_stimulus = 0\n",
    "\n",
    "fig = plotting.plot_surf_stat_map(\n",
    "    surf_mesh=mesh_inflated,\n",
    "    stat_map=np.std(betas_surf_left, axis=0),\n",
    "    hemi='left',\n",
    "    view='lateral',\n",
    "    cmap='cold_hot',\n",
    "    title=f'Subject {subject_id} Beta Map (Inflated)',\n",
    "    colorbar=True,\n",
    "    engine='plotly',\n",
    "    vmin=-5,\n",
    "    vmax=5\n",
    ")\n",
    "fig.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3d7ee0af",
   "metadata": {},
   "outputs": [],
   "source": [
    "from scipy.stats import zscore\n",
    "\n",
    "def zscore_betas(betas, df_stimuli):\n",
    "    assert np.isnan(betas).sum() == 0, 'Betas contain NaN values'\n",
    "    indices_session = df_stimuli['Session'].values\n",
    "    betas_zscore = np.zeros_like(betas)\n",
    "    sessions = np.unique(indices_session)\n",
    "    num_sessions = len(sessions)\n",
    "    for i_session in tqdm(sessions, total=num_sessions):\n",
    "        indices = np.where(indices_session == i_session)[0]\n",
    "        betas_zscore[indices] = zscore(betas[indices], axis=0)\n",
    "    print(np.sum(np.isnan(betas_zscore)))\n",
    "    return betas_zscore"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "bdd0cc7b",
   "metadata": {},
   "outputs": [],
   "source": [
    "betas_zeta_lh = zscore_betas(betas_surf_left, df_stimuli_processed)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9a365e93",
   "metadata": {},
   "outputs": [],
   "source": [
    "betas_surf_left.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "707ae1a5",
   "metadata": {},
   "outputs": [],
   "source": [
    "vol_T1 = nib.load(path_T1_processed)\n",
    "betas_stimulus = betas[idx_stimulus, :]\n",
    "betas_stimulus = zscore(betas_stimulus)\n",
    "vol_betas_stimulus = unmask(betas_stimulus, vol_brainmask)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "351467a9",
   "metadata": {},
   "outputs": [],
   "source": [
    "plotting.plot_stat_map(vol_betas_stimulus, bg_img=vol_T1, vmin=-3, vmax=3)\n",
    "plotting.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b5029ca0",
   "metadata": {},
   "outputs": [],
   "source": [
    "betas[idx_stimulus, :].shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "280fa1c3",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "src",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.0"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
