import json
import logging
import re
from typing import Optional

from src.utility import (
    Record,
    APICall,
    dataset_api_bank,
    APICallStatus,
    API_TOOL_CALL,
    generate_id,
)

api_bank_train_keys = ["instruction", "input", "output"]
api_bank_test_keys = ["file", "id", "instruction", "input", "expected_output"]

api_bank_api_pattern = re.compile(r"\[(\w+)\((.*)\)]")
api_bank_param_name_pattern = re.compile(r"(\w+)=")
api_bank_s_pattern = re.compile(r"\w(')\w")

logger = logging.getLogger(__name__)


def api_bank_process_train_data(record: dict) -> Optional[Record]:
    """
    Convert API-Bank training instance to Record object.
    :param record: Dict based API-Bank training data instance.
    :return: Training data instance in format of Record object.
    """
    # instruction is like: 'Generate an API request in the format of ...\nAPI descriptions:\n'
    instruction = record["instruction"]
    # fix typo in original API Bank data
    instruction = instruction.replace("utterence", "utterance")
    lines = [x.strip() for x in instruction.split("\n")]
    pre_api = [x for x in lines if len(x) > 0]

    # input is like: '{"apiCode": "send_help_alert"...}\nUser: I need to ...\nGenerate API Request:'
    input_lines = record["input"]
    # make train data api definition keys consistent with test data
    input_lines = (
        input_lines.replace('"apiCode":', '"name":')
        .replace('"parameters":', '"input_parameters":')
        .replace('"response":', '"output_parameters":')
    )
    input_lines = [x.strip() for x in input_lines.split("\n")]
    api = []
    conversation = []
    ending = []
    for line in input_lines:
        if len(line) == 0:
            continue
        if line.startswith("{"):
            api.append(line)
        else:
            if line.startswith("Generate API Request:"):
                ending.append(line)
            else:
                conversation.append(line)

    # output is like: 'API-Request: [schedule_appointment(...'
    output = record["output"]

    api_call = api_bank_str_to_api_call(output, False)
    if api_call is None:
        return None
    template_output = api_bank_api_call_to_template(api_call)

    return Record(
        id=generate_id(
            str(record["instruction"]) + str(record["input"]) + str(record["output"])
        ),
        data_set=dataset_api_bank,
        pre_api=pre_api,
        api_def=api,
        conversation=conversation,
        ending=ending,
        output=output,
        post_api=[],
        api_call=APICallStatus(api_call_status=API_TOOL_CALL, api_calls=[api_call]),
        template_output=[template_output],
    )


def api_bank_process_test_data(record: dict) -> Optional[Record]:
    """
    Convert API-Bank test instance to Record object.
    :param record: Dict based API-Bank test data instance.
    :return: Test data instance in format of Record object.
    """
    # instruction is like: 'Generate an API request in the format of ...\nAPI descriptions:\n{"name":...'
    instruction = record["instruction"]
    # fix typo in original API Bank data
    instruction = instruction.replace("utterence", "utterance")
    lines = [x.strip() for x in instruction.split("\n")]
    api_reached = False
    pre_api = []
    api = []
    for line in lines:
        if len(line) == 0:
            continue
        if api_reached:
            api.append(line)
        else:
            pre_api.append(line)
        if line.startswith("API descriptions"):
            api_reached = True

    # input is like: 'User: I need to ...\nGenerate API Request:'
    input_lines = record["input"]
    input_lines = [x.strip() for x in input_lines.split("\n")]
    conversation = []
    ending = []
    for line in input_lines:
        if len(line) == 0:
            continue
        if line.startswith("Generate API Request:"):
            ending.append(line)
        else:
            conversation.append(line)

    # output is like: API-Request: [schedule_appointment(...
    output = record["expected_output"]

    api_call = api_bank_str_to_api_call(output)
    if api_call is None:
        return None
    template_output = api_bank_api_call_to_template(api_call)

    return Record(
        id=f'{record["file"]}_{record["id"]}',
        data_set=dataset_api_bank,
        pre_api=pre_api,
        api_def=api,
        conversation=conversation,
        ending=ending,
        output=output,
        post_api=[],
        api_call=APICallStatus(api_call_status=API_TOOL_CALL, api_calls=[api_call]),
        template_output=[template_output],
    )


def api_bank_process_data(records: list[dict]) -> list[Record]:
    """
    Convert API-Bank data instances to Record objects.
    :param records: List of dict based API-Bank data instance.
    :return: List of Record containing API-Bank data instance.
    """
    new_records = []
    for record in records:
        if sorted(record.keys()) == sorted(api_bank_test_keys):
            new_record = api_bank_process_test_data(record)
        elif sorted(record.keys()) == sorted(api_bank_train_keys):
            new_record = api_bank_process_train_data(record)
        else:
            raise RuntimeError(f"Unable to parse:{record}")
        if new_record is None:
            continue
        new_records.append(new_record)
    return new_records


def api_bank_parse_api_request(api_request: str) -> Optional[APICall]:
    """
    Parse the API response string to create a APICall object.
    :param api_request: String based API response.
    :return: APICall object. None if failed to parse.
    """
    # input is like: [AddMeeting(end_time='2023-11-12 16:00:00', location='conference room', attendees=['John', 'Jane'])]
    match = api_bank_api_pattern.match(api_request)
    if match is None:
        logger.info("Unable to match API request:" + api_request)
        return None

    # api_name is like: AddMeeting
    api_name = match.group(1)
    # params is like: end_time='2023-11-12 16:00:00', location='conference room', attendees=['John', 'Jane']
    params = match.group(2)

    # truth file contains some record like "health_data='[{...},...]'", remove the single quote
    params = params.replace("'[", "[").replace("]'", "]")

    # add quote to name: "end_time"='2023-11-12 16:00:00', "location"='conference room', "attendees"=['John', 'Jane']
    params = api_bank_param_name_pattern.sub(r'"\1"=', params)
    # replace quote with colon: "end_time":'2023-11-12 16:00:00', "location":'conference room', "attendees":['John', 'Jane']
    params = params.replace("=", ":")
    # handle 's
    params = api_bank_s_pattern.sub(r"\\\1", params)
    # add curly braces
    params = "{" + params + "}"
    try:
        # parse with json
        params_json = json.loads(json.dumps(eval(params)))
    except:
        return None
    return APICall(
        api_name=api_name,
        params=params_json,
    )


def api_bank_extract_api_request_str(response: str) -> Optional[str]:
    """
    Extract API string from raw response.
    :param response: Response from models.
    :return: A string contains API call.
    """
    # input is like: "API-Request: [EmergencyKnowledge(symptom='Fatigue')]"
    if response is None or len(response) == 0:
        return None
    response = response.strip()
    if len(response) > 2 and response[0] == "[" and response[-1] == "]":
        return response
    prefix = "API-Request: ["
    prefix_index = response.find(prefix)
    if prefix_index < 0:
        # try to match case like "API-Request: EmergencyKnowledge(symptom='Fatigue')"
        leftover = f'[{response.removeprefix("API-Request: ")}]'
        try_match = api_bank_parse_api_request(leftover)
        if try_match is not None:
            return leftover
        return None
    start_idx = prefix_index + len(prefix) - 1
    end_idx = response.rfind("]")
    if end_idx < 0:
        return None
    # returned value is like: [EmergencyKnowledge(symptom='Fatigue')]
    return response[start_idx : end_idx + 1]


def api_bank_str_to_api_call(
    input_str: str, raise_error_on_failure: bool = True
) -> Optional[APICall]:
    """
    Parse APICall object from a string.
    :param input_str: String based API call information.
    :param raise_error_on_failure: Raise error if failed to parse APICall object.
    :return: Parsed APICall object.
    """
    requests_str = api_bank_extract_api_request_str(input_str)
    if requests_str is None:
        message = f"Failed to parse string to API-Bank API call: {input_str}"
        logger.error(message)
        if raise_error_on_failure:
            raise RuntimeError(message)
        else:
            return None
    api_call = api_bank_parse_api_request(requests_str)
    if api_call is None:
        message = f"Failed to parse API-Bank APICall: {input_str}"
        logger.error(message)
        if raise_error_on_failure:
            raise RuntimeError(message)
    return api_call


api_bank_no_param_format = "Call the `{}` API with no parameter"
api_bank_prefix_format = "Call the `{}` API with following parameters: "
api_bank_param_format = "`{}` as `{}`"


def api_bank_api_call_to_template(api_call: APICall) -> str:
    """
    Convert APICall object to a template based string.
    :param api_call: APICall object to convert.
    :return: Template based string to describe APICall.
    """
    if len(api_call.params) == 0:
        result = api_bank_no_param_format.format(api_call.api_name)
    else:
        param_values = []
        for k, v in api_call.params.items():
            param_values.append(api_bank_param_format.format(k, v))
        param_str = ", ".join(param_values)
        result = api_bank_prefix_format.format(api_call.api_name) + param_str
    return result
