from config import PERSISTENT_DATA_PATH, MY_DEBUG
from Testers.CliffWalkingTest import CliffWalkingVerifier, CliffWalkingDirectionalityVerifier
from Testers.HierachyCraftTest import HierachyCraftVerifier
from Testers.MiniGridTest import *
import argparse
from Testers.ALFTest import ALFVerifier
from Testers.RobomimicTest import RobomimicVerifier
from config import all_condition_list
verifier_dict = {
        "MiniGrid-DoorKey-5x5-v0": DoorKeyVerifier,
        "MiniGrid-FourRooms-v0": FourRoomsVerifier,
        "ALFWorld": ALFVerifier,
        "HCraft": HierachyCraftVerifier,
        "robomimic": RobomimicVerifier,
        "CliffWalking": CliffWalkingVerifier,
        "CliffWalkingDirectionality": CliffWalkingDirectionalityVerifier
    }
if __name__ == "__main__":
    parser = argparse.ArgumentParser(description="Language Model verifier")
    parser.add_argument('--env', type=str, help="domain", default="MiniGrid-DoorKey-5x5-v0")
    # Adding arguments
    parser.add_argument('--type', type=str, help="Feedback type", default="binary_feedback")  # Required positional argument
    parser.add_argument('--distribution', type=str, default="1",
                        help="Expert percentage in sampling distribution")  # Optional argument with default
    parser.add_argument('--source', type=str, default="vec-inf",
                        help="Inference backend")
    parser.add_argument('--url', type=str, default="http://gpu005:8080/v1",
                        help="Inference backend url")
    parser.add_argument('--model', type=str, default="Meta-Llama-3.1-8B-Instruct",
                        help="Model")
    parser.add_argument('--rounds', type=int, default=1, help="rounds of each state/action to get responses")
    parser.add_argument('--egocentric', type=bool, default=False, help="use egocentric observation")
    parser.add_argument('--known_dynamics', type=bool, default=False, help="use known dynamics")
    parser.add_argument('--explicit_action_by_action_cot', type=bool, default=False, help="use explicit action by action cot")
    parser.add_argument('--explicit_thinking_guides', type=bool, default=False,
                        help="use explicit thinking guides")
    parser.add_argument('--max_item_num', type=int, default=-1, help="maximum of data entries to test, -1 means all")
    parser.add_argument("--start_from", type=str, default="", help="start from a previous file")

    parser.add_argument("--uniform_sampling", type=bool, default=False, help="uniform sampling")
    parser.add_argument("--skip_neutral", type=bool, default=False, help="skip neutral preference")
    parser.add_argument("--api_key", type=str, default="", help="api key")
    parser.add_argument('--explain_legal_action_dynamics', type=bool, default=False,
                        help="In HCraft: explain legal action dynamics")
    parser.add_argument('--only_expert_path_dynamics', type=bool, default=False)
    parser.add_argument('--text_rendering', type=bool, default=False, help="text rendering for robomimic")
    parser.add_argument('--OLAF_style_delta_action', type=bool, default=False, help="robomimic, OLAF style delta action")
    parser.add_argument("--purpose", type=str, default="", help="purpose of the test, for logging")
    parser.add_argument("--load_prompt_from_config", type=str, default="", help="load prompt from config file, by default check under /prompts/ folder")
    parser.add_argument("--data_filter", type=str, default="", help="filter data by functions, the names are provided by = seperated str of function names in utils.py")
    parser.add_argument("--XYZ_only", type=bool, default=False, help="robomimic only check xyz for delta action")
    parser.add_argument("--history_context", type=bool, default=False, help="append history context")
    parser.add_argument("--unknown_dynamics", type=bool, default=False, help="use unknown dynamics")
    parser.add_argument("--debug_print", type=bool, default=False, help="print debug info")
    parser.add_argument("--ICL", type=bool, default=False, help="In Context Learning")
    parser.add_argument("--pair_preference", type=bool, default=False, help="ensure preferences come in pairs, A>B and B>A")
    parser.add_argument("--number_threads", type=int, default=1, help="number of threads to use when query api")
    # parser.add_argument("--use_weave", type=bool, default=True, help="use weave to log")
    parser.add_argument("--task_prompt", type=bool, default=False, help="use task prompt to say you gonna be asked blah blah")
    parser.add_argument("--XYZ_gripper", type=bool, default=False, help="robomimic only check xyz gripper")
    parser.add_argument("--check_prompt", type=bool, default=False, help="just check the prompt")
    parser.add_argument("--path", type=str, default="", help="arbitary load path")
    parser.add_argument("--image_observation", type=bool, default=False, help="use image observation for MiniGrid")
    args = parser.parse_args()

    if args.debug_print == True:
        print("Debug mode on")
        config.MY_DEBUG = True

    #TODO Move this in config.py
    path_dict = {
        "MiniGrid-DoorKey-5x5-v0": PERSISTENT_DATA_PATH + "/Doorkey/doorkey_{type}_{distribution}.npy".format
            (type=args.type, distribution=args.distribution),
        "MiniGrid-FourRooms-v0": PERSISTENT_DATA_PATH + "/FourRooms/FourRooms{type}_{distribution}.npy".format
            (type=args.type, distribution=args.distribution),
        "ALFWorld": PERSISTENT_DATA_PATH + "/ALF/ALF{type}_{distribution}.npy".format(type=args.type, distribution=args.distribution),
        "HCraft": PERSISTENT_DATA_PATH + "/HierachyCraft/HierachyCraft{type}_{distribution}.npy".format(type=args.type, distribution=args.distribution),
        "robomimic": PERSISTENT_DATA_PATH + "/robomimic/robomimic{type}_{distribution}.npy".format(type=args.type, distribution=args.distribution),
        "CliffWalking": PERSISTENT_DATA_PATH + "/CliffWalking/cliffwalking_{type}_{distribution}.npy".format(type=args.type, distribution=args.distribution),
        "CliffWalkingDirectionality": PERSISTENT_DATA_PATH + "/CliffWalkingDirectionality/cliffwalking_directionality_{type}_{distribution}.npy".format(type=args.type, distribution=args.distribution)
    }
    print(args)
    condition_list = []
    for condition in all_condition_list:
        if getattr(args, condition):
            condition_list.append(condition)

    default_system_prompt = "You are an expert game player"
    robomimic_system_prompt = "You are a professional robot engineer."

    system_prompt_dict = {
        "MiniGrid-DoorKey-5x5-v0": default_system_prompt,
        "MiniGrid-FourRooms-v0": default_system_prompt,
        "ALFWorld": default_system_prompt,
        "HCraft": default_system_prompt,
        "robomimic": robomimic_system_prompt,
        "CliffWalking": default_system_prompt,
        "CliffWalkingDirectionality": default_system_prompt
    }

    verifier = verifier_dict[args.env]
    instance_verifier = verifier(args.env, args.type, path_dict[args.env] if args.path == "" else args.path, condition_list, purpose_str=args.purpose, system_prompt=system_prompt_dict[args.env], data_filter=args.data_filter)
    if args.load_prompt_from_config != "":
        if args.load_prompt_from_config[0] == "/":
            prompt_config_path = args.load_prompt_from_config
        else:
            prompt_config_path = f"{PROMPT_CONFIG_PATH}/{args.load_prompt_from_config}"
        instance_verifier.load_prompt_from_config(prompt_config_path)
    if args.check_prompt:
        instance_verifier.check_prompt(max_item_num=args.max_item_num, skip_neutral=args.skip_neutral)
    else:
        results = instance_verifier.verify(args.rounds, args.source, url=args.url, model=args.model, max_item_num=args.max_item_num, start_from=args.start_from, uniform_sampling=args.uniform_sampling, skip_neutral=args.skip_neutral, api_key=args.api_key, pair_preference=args.pair_preference, numer_of_thread=args.number_threads)
