import os
import argparse
from math import ceil
import yaml
import torch
import numpy as np
import matplotlib.pyplot as plt
from bayes_dip.utils.plot_utils import DEFAULT_COLORS, configure_matplotlib
from bayes_dip.utils.evaluation_utils import extract_tensorboard_scalars, find_single_log_file, translate_path

parser = argparse.ArgumentParser()
parser.add_argument('--runs_file', type=str, default='runs_walnut_dip_mll_optim.yaml', help='path of yaml file containing hydra output directory names')
parser.add_argument('--experiments_outputs_path', type=str, default='../experiments/outputs', help='base path containing the hydra output directories (usually "[...]/outputs/")')
parser.add_argument('--experiments_multirun_path', type=str, default='../experiments/multirun', help='base path containing the hydra multirun directories (usually "[...]/multirun/")')
parser.add_argument('--save_data_to', type=str, default='', help='path to cache the plot data, such that they can be loaded with --load_data_from')
parser.add_argument('--load_data_from', type=str, default='', help='load data cached from a previous run with --save_data_to')
parser.add_argument('--tag_list', type=str, nargs='*', default=[], help='tensorboard tags to plot (e.g. "GPprior_lengthscale_0 GPprior_variance_0 NormalPrior_variance_2 observation_noise_variance"); if empty, plots all hyperparameters of GPprior and NormalPrior priors and the noise variance')
parser.add_argument('--suffix', type=str, default='', help='suffix for the figure filenames (e.g. summarizing the --tag_list)')
parser.add_argument('--rows', type=int, default=1, help='number of subplot rows')
parser.add_argument('--skip_sub_plots', type=int, nargs='*', default=[], help='subplot indices to skip (will be empty subplots)')
parser.add_argument('--legend_pos', type=int, default=-1, help='subplot index to place the legend in')
parser.add_argument('--legend_loc', type=str, default='', help='legend loc argument')
parser.add_argument('--legend_bbox_to_anchor', type=float, nargs='*', default=[], help='legend bbox_to_anchor argument')
parser.add_argument('--hspace', type=float, default=0.275, help='matplotlib\'s "hspace" gridspec_kw')
parser.add_argument('--wspace', type=float, default=0.275, help='matplotlib\'s "wspace" gridspec_kw')
args = parser.parse_args()

experiment_paths = {
        'outputs_path': args.experiments_outputs_path,
        'multirun_path': args.experiments_multirun_path,
}

with open(args.runs_file, 'r') as f:
    runs = yaml.safe_load(f)


def collect_walnut_hyperparams_figure_data(runs):
    data = {}

    log_file = find_single_log_file(os.path.join(
            translate_path(runs['include_predcp_False'], experiment_paths=experiment_paths),
            'mrglik_optim_0'))
    data['scalars'] = extract_tensorboard_scalars(log_file=log_file)

    log_file_predcp = find_single_log_file(os.path.join(
            translate_path(runs['include_predcp_True'], experiment_paths=experiment_paths),
            'mrglik_optim_0'))
    data['scalars_predcp'] = extract_tensorboard_scalars(log_file=log_file_predcp)

    return data

if args.load_data_from:
    print(f'loading data from {args.load_data_from}')
    data = torch.load(args.load_data_from)
else:
    data = collect_walnut_hyperparams_figure_data(runs)

if args.save_data_to:
    print(f'saving data to {args.save_data_to}')
    torch.save(data, args.save_data_to)

configure_matplotlib()

all_tags = [
        k[:-len('_scalars')] for k in data['scalars'].keys() if k.endswith('_scalars') and (
                k[:-len('_scalars')].rstrip('0123456789') in (
                        'GPprior_variance_', 'GPprior_lengthscale_', 'NormalPrior_variance_') or
                k[:-len('_scalars')] == 'observation_noise_variance')]

tag_list = args.tag_list or all_tags

# GPprior blocks are: In + (num_scales - 1) * Down + (num_scales - 1) * Up
num_scales = (len([t for t in all_tags if t.startswith('GPprior_lengthscale_')]) - 1) // 2 + 1

# NormalPrior blocks are: num_skips * Skip + Out
num_skips = len([t for t in all_tags if t.startswith('NormalPrior_variance_')]) - 1

num_rows, num_cols = args.rows, ceil(len(tag_list) / args.rows)

fig, axs = plt.subplots(num_rows, num_cols,
        figsize=(2.25 * num_cols, 2. * num_rows),
        gridspec_kw={'hspace': args.hspace, 'wspace': args.wspace})
axs = np.atleast_1d(axs).flatten()

def get_block_name(tag_base, idx, num_scales, num_skips):
    block_name = None
    if tag_base in ['GPprior_variance', 'GPprior_lengthscale']:
        if idx == 0:
            block_name = 'In'
        elif idx < 1 + (num_scales - 1):
            block_name = f'Down {idx - 1 + 1}'
        else:
            block_name = f'Up {idx - (1 + (num_scales - 1)) + 1}'
    elif tag_base == 'NormalPrior_variance':
        if idx < num_skips:
            block_name = f'Skip {idx + 1}'
        else:
            block_name = 'Out'
    return block_name

def get_hyperparam_tex_from_tensor_board_tag(tag, include_block_name=True, **kwargs):
    title = None
    if tag == 'observation_noise_variance':
        title = '$\sigma_y^2$'
    elif tag.startswith('GPprior_') or tag.startswith('NormalPrior_'):
        tag_base, idx = tag.rsplit('_', 1)
        idx = int(idx)
        if tag_base == 'GPprior_variance':
            title = f'$\sigma_{{{idx + 1}}}^2$'
        elif tag_base == 'GPprior_lengthscale':
            title = f'$\ell_{{{idx + 1}}}$'
        elif tag_base == 'NormalPrior_variance':
            title = f'$\sigma_{{1\\times 1,{idx + 1}}}^2$'
        if include_block_name:
            title += f' ({get_block_name(tag_base, idx, **kwargs)})'
    return title

for ax, tag in zip(
        axs[[i for i in range(axs.size) if i not in args.skip_sub_plots]], tag_list):
    ax.plot(data['scalars'][f'{tag}_steps'], data['scalars'][f'{tag}_scalars'],
        label='MLL', color=DEFAULT_COLORS['bayes_dip'], alpha=0.9,
        linewidth=2, linestyle='dashed')
    ax.plot(data['scalars_predcp'][f'{tag}_steps'], data['scalars_predcp'][f'{tag}_scalars'],
            label='TV-MAP', color=DEFAULT_COLORS['bayes_dip_predcp'], alpha=0.9,
            linewidth=2, linestyle='dashed')
    ax.set_yscale('log')
    title = get_hyperparam_tex_from_tensor_board_tag(
            tag, num_scales=num_scales, num_skips=num_skips)
    ax.set_title(title)
    ax.tick_params(axis='both', which='major', labelsize='small')
    ax.tick_params(axis='both', which='minor', labelsize='xx-small')
    ax.grid(alpha=0.3)
    ax.spines['top'].set_visible(False)
    ax.spines['right'].set_visible(False)

for i, ax in enumerate(axs):
    if i // num_cols < num_rows - 1 and (i + num_cols) not in args.skip_sub_plots:
        ax.tick_params(labelbottom=False)
    else:
        ax.set_xlabel('iterations', fontsize='small')
    if i in args.skip_sub_plots:
        if i != args.legend_pos:
            ax.remove()
        else:
            ax.set_axis_off()

handles, labels = next(
        ax.get_legend_handles_labels() for i, ax in enumerate(axs)
        if i not in args.skip_sub_plots)
legend_kwargs = {}
if args.legend_bbox_to_anchor:
    legend_kwargs['bbox_to_anchor'] = args.legend_bbox_to_anchor
if args.legend_loc:
    legend_kwargs['loc'] = args.legend_loc
elif args.legend_pos in args.skip_sub_plots:
    legend_kwargs['loc'] = 'center'
axs[args.legend_pos].legend(handles, labels, **legend_kwargs)

suffix = '_' + args.suffix if args.suffix and not args.suffix.startswith('_') else args.suffix
fig.savefig(f'walnut_hyperparams{suffix}.pdf', bbox_inches='tight', pad_inches=0.)
fig.savefig(f'walnut_hyperparams{suffix}.png', bbox_inches='tight', pad_inches=0., dpi=600)
