import logging
from pathlib import Path

_logger = logging.getLogger(__name__)

try:
    import lm_eval
    from lm_eval.models.huggingface import HFLM
    from lm_eval.evaluator import EvaluationTracker
except ImportError:
    _logger.warning('lm_eval library is not installed. Cannot use lm_eval.')

DEFAULT_HARNESS_TASKS = ["hellaswag", "lambada_standard", "arc_challenge", "mmlu", "siqa", "piqa", "winogrande", "wikitext"]

def wrap_hf_model(model, tokenizer, max_length=2048):
    return HFLM(
        pretrained=model,
        tokenizer=tokenizer,
        max_length=max_length,
        trust_remote_code=True,
    )


def evaluate_with_harness(
        model,
        tokenizer,
        tasks=tuple(DEFAULT_HARNESS_TASKS),
        apply_chat_template=False,
        log_path=None
):
    lm_obj = wrap_hf_model(model, tokenizer)
    _logger.info(Path(__file__).parent / "custom_tasks")
    task_manager = lm_eval.tasks.TaskManager(include_path=str(Path(__file__).parent / "custom_tasks"))
    eval_args = dict(
        model=lm_obj,
        tasks=list(tasks),
        task_manager=task_manager,
        apply_chat_template=apply_chat_template,
    )
    if log_path is not None:
        eval_args["evaluation_tracker"] = EvaluationTracker(output_path=log_path)
        eval_args["model_args"] = ""

    results = lm_eval.simple_evaluate(**eval_args)

    return results["results"]

