import collections
import dataclasses
import logging
import json
import pathlib
from pathlib import Path
from omegaconf import OmegaConf
import imageio
import calvin_env
import hydra
import re
import os
from examples.calvin.multistep_sequences import get_sequences
from examples.calvin.evaluate_utils import (
    get_env_state_for_initial_condition
)
# from online_evaluation_calvin.evaluate_utils import get_env
# from libero.libero import benchmark
# from libero.libero import get_libero_path
# from libero.libero.envs import OffScreenRenderEnv
import numpy as np
from openpi_client import image_tools
from openpi_client import websocket_client_policy as _websocket_client_policy
from tqdm import tqdm
import tyro
import time
# import multiprocessing as multiprocessing
# Number of evaluation sequences requested from ``get_sequences``; it is also
# printed after the "/" in every progress line written by ``eval_calvin``.
NUM_SEQUENCES = 1000
# Upper bound on the number of environment steps spent on a single subtask
# before that subtask is counted as failed.
EP_LEN = 360

@dataclasses.dataclass
class Args:
    """Command-line options for the CALVIN evaluation script."""

    # ------------------------------------------------------------------
    # Model server parameters
    # ------------------------------------------------------------------
    host: str = "0.0.0.0"  # Policy server host
    port: int = 8000  # Policy server port
    resize_size: int = 224  # Side length images are resized (with padding) to before inference
    replan_steps: int = 10  # Number of actions executed from each predicted chunk before re-querying

    action_type: str = "joint"  # "joint" sends joint_abs commands, "eef" sends cartesian_abs commands

    # ------------------------------------------------------------------
    # Options carried over from the LIBERO evaluation script. Nothing in
    # eval_calvin reads them; they are kept so existing command lines still parse.
    # ------------------------------------------------------------------
    task_suite_name: str = "libero_spatial"  # Options: libero_spatial, libero_object, libero_goal, libero_10, libero_90
    num_steps_wait: int = 10  # Number of steps to wait for objects to stabilize in sim
    num_trials_per_task: int = 50  # Number of rollouts per task

    # ------------------------------------------------------------------
    # Utils
    # ------------------------------------------------------------------
    # The two output locations default to one particular checkpoint's folders;
    # pass different values on the command line to evaluate another run.
    video_out_path: str = "data/abc_eef_d_joint_experts64_topk4_100k/videos_pre10"  # Path to save videos
    eval_dir: str = "data/abc_eef_d_joint_experts64_topk4_100k/metric_pre10"  # Path to save evaluation results
    seed: int = 7  # Random Seed (for reproducibility)

def get_env(dataset_path, obs_space=None, show_gui=True, **kwargs):
    """Instantiate the environment described by a dataset split's hydra config.

    Args:
        dataset_path: Directory containing ``.hydra/merged_config.yaml``.
        obs_space: Optional mapping with ``"rgb_obs"`` and ``"depth_obs"``
            lists. When given, every camera in the config whose name is not
            the second ``_``-separated token of one of those keys is removed.
        show_gui: Forwarded to the instantiated environment.
        **kwargs: Only ``scene`` is inspected. When present, the matching
            ``conf/scene/<scene>.yaml`` next to the ``calvin_env`` package
            replaces the ``scene`` node of the loaded config.

    Returns:
        The object produced by ``hydra.utils.instantiate`` for the ``env`` node.
    """
    from pathlib import Path

    from omegaconf import OmegaConf

    config_file = Path(dataset_path) / ".hydra" / "merged_config.yaml"
    render_conf = OmegaConf.load(config_file)
    if os.path.exists(config_file):
        print("**********************render_conf exists")

    if obs_space is not None:
        configured_cameras = set(render_conf.cameras.keys())
        # Observation keys look like "<modality>_<camera>"; keep token 1.
        requested_cameras = {
            re.split("_", obs_key)[1]
            for obs_key in obs_space["rgb_obs"] + obs_space["depth_obs"]
        }
        for camera_name in configured_cameras - requested_cameras:
            del render_conf.cameras[camera_name]

    if "scene" in kwargs:
        print("**********************scene exists")
        scene_file = Path(calvin_env.__file__).parents[1] / "conf/scene" / f"{kwargs['scene']}.yaml"
        scene_cfg = OmegaConf.load(scene_file)
        if os.path.exists(scene_file):
            print("**********************scene_cfg exists")
        OmegaConf.update(render_conf, "scene", scene_cfg)

    # hydra must be initialised once per process before instantiate is used.
    hydra_state = hydra.core.global_hydra.GlobalHydra.instance()
    if not hydra_state.is_initialized():
        hydra.initialize(".")

    return hydra.utils.instantiate(
        render_conf.env,
        show_gui=show_gui,
        use_vr=False,
        use_scene_info=True,
    )


def make_env(dataset_path, show_gui=True, split="validation", scene=None):
    """Create the environment for one split of a dataset directory.

    Args:
        dataset_path: Root directory of the dataset.
        show_gui: Forwarded to ``get_env``.
        split: Name of the sub-directory (below ``dataset_path``) to load from.
        scene: Optional scene name; only forwarded to ``get_env`` when it is
            not ``None``.

    Returns:
        Whatever ``get_env`` returns for the selected split folder.
    """
    val_folder = Path(dataset_path).joinpath(f"{split}")
    print("val_folder:", val_folder)

    # Pass ``scene`` through only when the caller actually supplied one, so
    # get_env's ``"scene" in kwargs`` check behaves as before.
    scene_kwargs = {} if scene is None else {"scene": scene}
    return get_env(val_folder, show_gui=show_gui, **scene_kwargs)

from collections import Counter
def count_success(results):
    """Return the fraction of sequences that completed at least 1..5 subtasks.

    Args:
        results: Sized iterable with one integer per evaluated sequence: the
            number of consecutive subtasks solved in that sequence.

    Returns:
        A list of five floats; entry ``i`` (zero-based) is the share of
        sequences whose count lies in ``i + 1 .. 5``. For empty ``results``
        the list is all zeros instead of raising ``ZeroDivisionError``.
    """
    n_sequences = len(results)
    if n_sequences == 0:
        # Nothing evaluated yet: report zero success rather than dividing by 0.
        return [0.0] * 5

    count = Counter(results)
    return [
        sum(count[solved] for solved in range(min_solved, 6)) / n_sequences
        for min_solved in range(1, 6)
    ]

# Address the script used to have hard-coded for the policy server. It is still
# used whenever ``Args.host`` is left at its "0.0.0.0" default, so existing
# invocations keep connecting to the same place.
_FALLBACK_SERVER_HOST = "172.17.0.1"
# Root of the CALVIN dataset whose "validation" split configures the simulator.
_CALVIN_DATASET_PATH = "/mnt/blob/CALVIN/task_ABCD_D/"
# Values of ``Args.action_type`` that ``_to_env_action`` can translate.
_ACTION_TYPES = ("eef", "joint")


def _to_env_action(action, action_type):
    """Convert one predicted action vector into the dict given to ``env.step``.

    The last entry is snapped to -1 (negative values) or 1 (everything else)
    on a copy, so the policy's array is left untouched. That entry is
    presumably the gripper command; confirm against the policy's action layout.

    Raises:
        ValueError: If ``action_type`` is not "eef" or "joint".
    """
    action = action.copy()
    action[-1] = -1 if action[-1] < 0 else 1

    if action_type == "eef":
        assert action.shape[0] == 7, f"expected a 7-dim eef action, got {action.shape[0]}"
        # Split into three groups: entries 0-2, entries 3-5, and the last entry.
        return {
            "type": "cartesian_abs",
            "action": [action[:3], action[3:6], action[[6]]],
        }
    if action_type == "joint":
        assert action.shape[0] == 8, f"expected an 8-dim joint action, got {action.shape[0]}"
        return {"type": "joint_abs", "action": action}
    raise ValueError(f"Unsupported action_type {action_type!r}; expected one of {_ACTION_TYPES}")


def _rollout_subtask(env, client, task_oracle, subtask, lang_annotation, args):
    """Run the policy on one subtask for at most ``EP_LEN`` steps.

    Returns:
        True as soon as the task oracle reports ``subtask`` as solved relative
        to the state at the start of the rollout, False if the step budget is
        used up first.
    """
    action_plan = collections.deque()
    obs = env.get_obs()
    start_info = env.get_info()
    print('------------------------------')
    print(f'task: {lang_annotation}')

    for step in tqdm(range(EP_LEN)):
        if not action_plan:
            # Previous chunk is used up: query the policy for a new one. The
            # images are only needed here, so they are resized here and not
            # on every environment step.
            img = image_tools.convert_to_uint8(
                image_tools.resize_with_pad(obs["rgb_obs"]["rgb_static"], args.resize_size, args.resize_size)
            )
            wrist_img = image_tools.convert_to_uint8(
                image_tools.resize_with_pad(obs["rgb_obs"]["rgb_gripper"], args.resize_size, args.resize_size)
            )
            element = {
                "observation/image": img,
                "observation/wrist_image": wrist_img,
                "observation/state": obs['robot_obs'],
                "prompt": str(lang_annotation),
            }
            action_chunk = client.infer(element)["actions"]
            assert (
                len(action_chunk) >= args.replan_steps
            ), f"We want to replan every {args.replan_steps} steps, but policy only predicts {len(action_chunk)} steps."
            action_plan.extend(action_chunk[: args.replan_steps])

        action_dict = _to_env_action(action_plan.popleft(), args.action_type)
        obs, _, _, current_info = env.step(action_dict)

        # A non-empty result means the oracle considers the subtask solved.
        current_task_info = task_oracle.get_task_info_for_set(start_info, current_info, {subtask})
        if len(current_task_info) > 0:
            print(f"task {subtask} solved at step {step}")
            return True
    return False


def eval_calvin(args: Args) -> None:
    """Evaluate a remote policy on CALVIN multi-step sequences.

    For each of the ``NUM_SEQUENCES`` sequences the environment is reset to
    the sequence's initial state and the subtasks are attempted in order; a
    sequence stops at the first subtask that is not solved within ``EP_LEN``
    steps. After every sequence the running success rates from
    ``count_success`` are appended as one line to
    ``<args.eval_dir>/success_rate.txt``.

    Args:
        args: Parsed command-line options. ``args.host`` is honoured unless it
            is the "0.0.0.0" default, in which case the previously hard-coded
            address ``172.17.0.1`` is used.

    Raises:
        ValueError: If ``args.action_type`` is not "eef"/"joint" or
            ``args.replan_steps`` is smaller than 1. Both are checked before
            any connection or simulator is created.
    """
    # Fail fast on settings that would otherwise only blow up mid-rollout.
    if args.action_type not in _ACTION_TYPES:
        raise ValueError(
            f"Unsupported action_type {args.action_type!r}; expected one of {_ACTION_TYPES}"
        )
    if args.replan_steps < 1:
        raise ValueError(f"replan_steps must be >= 1, got {args.replan_steps}")

    # Set random seed
    np.random.seed(args.seed)

    # The video directory is still created for compatibility, although this
    # function does not currently write any videos into it.
    pathlib.Path(args.video_out_path).mkdir(parents=True, exist_ok=True)

    server_host = _FALLBACK_SERVER_HOST if args.host == "0.0.0.0" else args.host
    client = _websocket_client_policy.WebsocketClientPolicy(server_host, args.port)

    conf_dir = Path("third_party/calvin/calvin_models") / "conf"
    task_cfg = OmegaConf.load(conf_dir / "callbacks/rollout/tasks/new_playtable_tasks.yaml")
    task_oracle = hydra.utils.instantiate(task_cfg)

    os.makedirs(args.eval_dir, exist_ok=True)
    eval_sr_path = os.path.join(args.eval_dir, "success_rate.txt")

    env = make_env(_CALVIN_DATASET_PATH, show_gui=False)
    eval_sequences = get_sequences(NUM_SEQUENCES)
    val_annotations = OmegaConf.load(
        conf_dir / "annotations/new_playtable_validation.yaml"
    )
    print(val_annotations)

    results = []
    for seq_ind, (initial_state, eval_sequence) in enumerate(eval_sequences):
        robot_obs, scene_obs = get_env_state_for_initial_condition(initial_state)
        env.reset(robot_obs=robot_obs, scene_obs=scene_obs)

        success_counter = 0
        for subtask in eval_sequence:
            # The first annotation listed for the subtask is used as the prompt.
            lang_annotation = val_annotations[subtask][0]
            if not _rollout_subtask(env, client, task_oracle, subtask, lang_annotation, args):
                # Subtasks build on each other; stop at the first failure.
                break
            success_counter += 1

        results.append(success_counter)
        success_list = count_success(results)
        # seq_ind is zero-based, so the label of the first line reads
        # "0/<NUM_SEQUENCES>"; the format is left as-is for existing log readers.
        line = (
            f"{seq_ind}/{NUM_SEQUENCES}: "
            + "".join(f"{sr:.3f} | " for sr in success_list)
            + "\n"
        )
        with open(eval_sr_path, 'a') as f:
            f.write(line)

        
if __name__ == "__main__":
    import multiprocessing

    # Force the "spawn" start method unless it is already selected; presumably
    # this avoids fork-related problems with the simulator (TODO confirm).
    current_start_method = multiprocessing.get_start_method(allow_none=True)
    if current_start_method != "spawn":
        multiprocessing.set_start_method("spawn", force=True)

    logging.basicConfig(level=logging.INFO)

    # Parse the command line into Args, then run the evaluation.
    cli_args = tyro.cli(Args)
    eval_calvin(cli_args)
