from .extractor_base import ExtractorBase
from ..utils import get_openai_model_response


GPT4_TRIPLET_EXTRACTION_PROMPT_Q = \
"""Given a question and a candidate answer to the question, please extract a KG from the candidate answer condition on the question and represent the KG with triples formatted with ("head", "relation", "tail").
Please note that this is an EXTRACTION task, so DO NOT care about whether the content of the candidate answer is factual or not, just extract the triplets from it.

Here are some in-context examples:

### Question:
Given these paragraphs about the Tesla bot, what is its alias?

### Candidate Answer:
Optimus (or Tesla Bot) is a robotic humanoid under development by Tesla, Inc. It was announced at the company's Artificial Intelligence (AI) Day event on August 19, 2021.

### KG:
("Optimus", "is", "robotic humanoid")
("Optimus", "under development by", "Tesla, Inc.")
("Optimus", "also known as", "Tesla Bot")
("Tesla, Inc.", "announced", "Optimus")
("Announcement of Optimus", "occured at", "Artificial Intelligence (AI) Day event")
("Artificial Intelligence (AI) Day event", "held on", "August 19, 2021")
("Artificial Intelligence (AI) Day event", "organized by", "Tesla, Inc.")


### Question:
here is some text about Andre Weiss, how many years was Andre at University of Dijon in Paris?

### Candidate Answer:
11 years

### KG:
("Andre Weiss at University of Dijon in Paris", "duration", "11 years")


Now generate the KG for the following candidate answer based on the provided question:

### Question:
{q}

### Candidate Answer:
{a}

### KG:
"""

GPT4_TRIPLET_EXTRACTION_PROMPT = \
"""Given a description of the image, please extract a KG from the text and represent the KG with triples formatted with ("subject", "predicate", "object") with readability, each triplet in a line. If 'and' or 'or' exists in the input sentence, split the objects into multiple triplets. Please do not extract from uninformative sentences.

Here are some in-context examples:

### Input:
Optimus (or Tesla Bot) is a robotic humanoid under development by Tesla, Inc. It was announced at the company's Artificial Intelligence (AI) Day event on August 19, 2021. It is planned to measure 5 ft 8 in (173 cm) tall and weigh 125 lb (57 kg). It is hard to answer whether Tesla is good to invest without more information. 

### KG:
("Optimus", "is", "robotic humanoid") 
("Optimus", "under development by", "Tesla, Inc.") 
("Optimus", "also known as", "Tesla Bot") 
("Tesla, Inc.", "announced", "Optimus") 
("Announcement of Optimus", "occured at", "Artificial Intelligence (AI) Day event") 
("Artificial Intelligence (AI) Day event", "held on", "August 19, 2021") 
("Artificial Intelligence (AI) Day event", "organized by", "Tesla, Inc.") 
("Optimus", "planned to measure", "5 ft 8 in (173 cm) tall")
("Optimus", "planned to measure", "weigh 125 lb (57 kg).")
<Done>

### Input:
The image doesn't provide information about the popularity of the song. The song "Here Comes the Boom" was originally released by American rock band Nelly in 2002 for the soundtrack of the film "The Longest Yard." 

### KG:
("The song 'Here Comes the Boom'", "originally released by", "American rock band Nelly") 
("The song 'Here Comes the Boom'", "released in", "2002") 
("The song 'Here Comes the Boom'", "featured in", "soundtrack of the film 'The Longest Yard'") 
("American rock band Nelly", "released", "The song 'Here Comes the Boom'") 
("The Longest Yard", "had soundtrack featuring", "The song 'Here Comes the Boom'") 
<Done>

Now generate the KG for the provided input text:

### Input:
{input_text}

### KG:
"""


class GPT4Extractor(ExtractorBase):
    def __init__(
        self,
        claim_format:str='triplet'
    ) -> None:
        super().__init__(claim_format=claim_format)
        if self.claim_format == 'triplet':
            self.prompt_temp_wq = GPT4_TRIPLET_EXTRACTION_PROMPT_Q
            self.prompt_temp = GPT4_TRIPLET_EXTRACTION_PROMPT
    
    def extract_claim_triplets(self, response, question=None):
        if question is None:
            prompt = self.prompt_temp.format(
                input_text=response
            )
        else:
            prompt = self.prompt_temp_wq.format(
                q=question,
                a=response
            )
        gpt4_response = get_openai_model_response(
            prompt,
            temperature=0,
            model='gpt-4-1106-preview'
        )
        if gpt4_response and len(gpt4_response):
            kg_str = None
            if '###' in gpt4_response:
                kg_str = gpt4_response[:gpt4_response.index('###')]
            else:
                kg_str = gpt4_response
            triplets = self._parse_claim_triplets(kg_str)
            return triplets
        return []
