import os
import torch
from model import SEDD
import utils
from model.ema import ExponentialMovingAverage
import graph_lib
import noise_lib

from omegaconf import OmegaConf

def load_model_hf(dir, device):
    score_model = SEDD.from_pretrained(dir).to(device)
    graph = graph_lib.get_graph(score_model.config, device)
    noise = noise_lib.get_noise(score_model.config).to(device)
    return score_model, graph, noise


def load_model_local(root_dir, device, specific_checkpoint=None):
    cfg = utils.load_hydra_config_from_run(root_dir)
    graph = graph_lib.get_graph(cfg, device)
    noise = noise_lib.get_noise(cfg).to(device)
    score_model = SEDD(cfg).to(device)
    ema = ExponentialMovingAverage(score_model.parameters(), decay=cfg.training.ema)
    if specific_checkpoint is not None:
        ckpt_dir = os.path.join(root_dir, "checkpoints", specific_checkpoint)
    else:
        ckpt_dir = os.path.join(root_dir, "checkpoints-meta", "checkpoint.pth")
    loaded_state = torch.load(ckpt_dir, map_location=device, weights_only=False)
    if cfg.distill.is_distill:
        score_model.load_state_dict(loaded_state['student'])
        ema.load_state_dict(loaded_state['ema_student'])
    else:
        score_model.load_state_dict(loaded_state['model'])
        ema.load_state_dict(loaded_state['ema'])

    ema.store(score_model.parameters())
    ema.copy_to(score_model.parameters())
    return score_model, graph, noise


def load_model(root_dir, device, specific_checkpoint = None):
    try:
        return load_model_hf(root_dir, device)
    except:
        return load_model_local(root_dir, device, specific_checkpoint=specific_checkpoint)