import jax
from jax import numpy as jnp

from ProtLig_GPCRclassA.utils import tf_to_jax, tf_to_jraph_graph_reshape

from ProtLig_GPCRclassA.amino_GNN.make_loss_func import make_loss_func, make_aux_loss_func
from ProtLig_GPCRclassA.amino_GNN.make_compute_metrics import make_compute_metrics

def make_train_step(loss_func, init_rngs, reg_loss_func = None, aux_loss_func = None):
    """
    Build a single-batch training step function.

    Parameters:
    -----------
    loss_func : callable
        Called as ``loss_func(logits, labels)`` and must return a scalar loss.

    init_rngs : Any
        Currently unused by this factory; kept so existing callers keep working.

    reg_loss_func : callable, optional
        If given, ``reg_loss_func(params)`` is added to the loss.

    aux_loss_func : callable, optional
        If given, ``aux_loss_func(logits, labels)`` is added to the loss.

    Returns:
    --------
    train_step : callable
        ``train_step(state, batch) -> (state, logits, grads)``. The function is
        returned un-jitted; wrap it in ``jax.jit`` at the call site if desired.

    Notes:
    ------
    ``state`` must expose ``rngs``, ``params``, ``apply_fn``, ``replace`` and
    ``apply_gradients`` (presumably a flax ``TrainState`` extended with an
    ``rngs`` field -- TODO confirm). ``batch`` is a sequence whose last element
    holds the labels; everything before it is passed to ``state.apply_fn``.
    """
    if aux_loss_func is not None:
        def _loss_func(logits, labels):
            return loss_func(logits, labels) + aux_loss_func(logits, labels)
    else:
        _loss_func = loss_func

    def _advance_key(key):
        # Keep the first half of the split as the PRNGKey for this step.
        return jax.random.split(key)[0]

    def train_step(state, batch):
        """
        Run one gradient update on ``batch`` and return ``(state, logits, grads)``.
        """
        # jax.tree_util.tree_map replaces the removed jax.tree_map alias.
        state = state.replace(rngs = jax.tree_util.tree_map(_advance_key, state.rngs)) # update PRNGKeys

        def loss_fn(params):
            logits = state.apply_fn(params, batch[:-1], deterministic = False, rngs = state.rngs)
            loss_val = _loss_func(logits = logits, labels = batch[-1])
            # Plain Python check: decided once when the step is traced, not per call.
            if reg_loss_func is not None:
                loss_val = loss_val + reg_loss_func(params)
            return loss_val, logits

        # has_aux = True makes the gradient function return the logits as well.
        grads, logits = jax.grad(loss_fn, has_aux = True)(state.params)
        state = state.apply_gradients(grads = grads) # This handles updates of opt_state and params
        return state, logits, grads

    return train_step


def make_train_epoch(is_weighted, loss_option, init_rngs, logger, aux_loss_option = None, reg_loss_func = None, loader_output_type = 'jax', num_classes = 3):
    """
    Helper function to create train_epoch function.

    Parameters:
    -----------
    is_weighted, loss_option, num_classes :
        Forwarded to ``make_loss_func``.

    init_rngs :
        Forwarded to ``make_train_step``.

    logger :
        Not used by the code in this function.

    aux_loss_option : optional
        If not None, forwarded to ``make_aux_loss_func`` and the resulting
        auxiliary loss is used in both the train step and the metrics.

    reg_loss_func : callable, optional
        Forwarded to ``make_train_step``.

    loader_output_type : str
        ``'jax'`` if the loader yields batches that can be fed to the jitted
        train step directly, ``'tf'`` if it yields TensorFlow tensors that must
        be converted first.

    Returns:
    --------
    train_epoch : callable
        ``train_epoch(state, loader) -> (state, batch_metrics)`` where
        ``batch_metrics`` is a list with one ``compute_metrics`` result per batch.

    Raises:
    -------
    ValueError
        If ``loader_output_type`` is neither ``'jax'`` nor ``'tf'``.
    """
    # Fail early with a clear message instead of an UnboundLocalError at return.
    if loader_output_type not in ('jax', 'tf'):
        raise ValueError("Unknown loader_output_type: {!r}. Expected 'jax' or 'tf'.".format(loader_output_type))

    loss_func = make_loss_func(is_weighted = is_weighted, option = loss_option, num_classes = num_classes)
    if aux_loss_option is not None:
        aux_loss_func = make_aux_loss_func(option = aux_loss_option)
    else:
        aux_loss_func = None
    compute_metrics = make_compute_metrics(loss_func = loss_func, use_jit = False, num_classes = num_classes, aux_loss_func = aux_loss_func)
    train_step = make_train_step(loss_func = loss_func, init_rngs = init_rngs, reg_loss_func = reg_loss_func, aux_loss_func = aux_loss_func)
    # jit:
    train_step = jax.jit(train_step)

    # Case loader outputs jnp.DeviceArray:
    if loader_output_type == 'jax':
        def train_epoch(state, loader):
            batch_metrics = []
            for batch in loader:
                state, logits, _ = train_step(state, batch)
                batch_metrics.append(compute_metrics(logits, labels = batch[-1]))
            # The loader is reset after every full pass.
            loader.reset()
            return state, batch_metrics
    # Case loader outputs tf.Tensor:
    else:
        def train_epoch(state, loader):
            # Look up the target device once per epoch rather than once per leaf.
            device = jax.devices()[0]

            def _to_device(x):
                return jax.device_put(tf_to_jax(x), device = device)

            batch_metrics = []
            for _, batch in loader.enumerate():
                # jax.tree_util.tree_map replaces the removed jax.tree_map alias.
                batch = jax.tree_util.tree_map(_to_device, batch)
                # Only the middle element goes through the jraph reshape helper.
                batch = batch[0], tf_to_jraph_graph_reshape(batch[1]), batch[2]
                state, logits, _ = train_step(state, batch)
                batch_metrics.append(compute_metrics(logits, labels = batch[-1]))
            return state, batch_metrics
    return train_epoch