#!/usr/bin/env python3
import argparse
import json
import os
import re
from typing import Dict, List, Any, Optional
import time
from openai import APIStatusError  
from concurrent.futures import ProcessPoolExecutor, as_completed
from tqdm import tqdm
from openai import OpenAI
from tools import get_not_fact


def load_data(input_file: str) -> List[Dict]:
    with open(input_file, 'r', encoding='utf-8') as f:
        return json.load(f)


def save_data(output_file: str, data: List[Dict]):
    os.makedirs(os.path.dirname(output_file) if os.path.dirname(output_file) else '.', exist_ok=True)
    with open(output_file, 'w', encoding='utf-8') as f:
        json.dump(data, f, indent=2, ensure_ascii=False)


class LLMHelper:
    def __init__(self, api_key: str, base_url: str, model: str):
        if base_url:
            self.client = OpenAI(api_key=api_key, base_url=base_url)
        else:
            self.client = OpenAI(api_key=api_key)
        self.model = model


    def chat(self, messages: List[Dict[str, str]]) -> str:

        completion = self.client.chat.completions.create(
            model=self.model,
            messages=messages,
            temperature=0,
            top_p=1,
            stream=True,
            stream_options={"include_usage": True}
            )
        content_parts = []
        for chunk in completion:
            if chunk.choices:
                content = chunk.choices[0].delta.content or ""
                content_parts.append(content)
        full_response = "".join(content_parts)

        return full_response

            
# ========== 任务选择 ==========


def translate(llm_helper, item):
    user_prompt="""You are given a logic problem in natural language including a context and a question as follows:
Context: 
${context}
Question: 
${question}

Your final task is to translate the logic problem in natural language into first-order logic formulas. The grammar of first-order logic is defined as follows:
logical conjunction: expr1 ∧ expr2
logical disjunction: expr1 ∨ expr2
logical exclusive disjunction: expr1 ⊕ expr2
logical negation: ¬expr1
expr1 implies expr2: expr1 → expr2
expr1 if and only if expr2: expr1 ↔ expr2
logical universal quantification: ∀ x
logical existential quantification: ∃ x
Output format: logic form ::: description

OTHER RULES:
1.	If a number in a formula contains a decimal point, rewrite it in a parser-safe format. For example, use 423e8 to represent 4.23e10 (no decimal points allowed).
2.	Move all quantifiers to the front. Do not use nested quantifiers. Quantifiers are not allowed to appear inside subformulas of → ∧ ∨ ⊕ ↔. For example, expressions like ∀y ( ... ∃x ... ) → ... are not allowed.
3.	Do not use any symbols other than
['⊕', '∨', '∧', '→', '↔', '∀', '∃', '¬', '(', ')', ',', '='].
For example, symbols such as ≠ are not permitted.
4.	The same symbol must not be used both as a predicate and as a constant. Letter case (uppercase vs lowercase) must not be used as a distinguishing feature; renaming is required. For example, Romance(x) and LanguageFamily(romance) are invalid, because Romance and romance are considered the same symbol.
5.	Variable names must be single lowercase letters.

---------------
Example:
Context: 
All people who regularly drink coffee are dependent on caffeine.
(... more context here ...)
If Rina is not a person dependent on caffeine and a student, then Rina is either a person dependent on caffeine and a student, or a person dependent on caffeine nor a student, or neither a person dependent on caffeine nor a student.

Question: Based on the above information, is the following statement true, false, or uncertain? Rina is either a person who jokes about being addicted to caffeine or is unaware that caffeine is a drug.

Predicates:
Dependent(x) ::: x is a person dependent on caffeine
(... more predicates here ...)
Student(x) ::: x is a student

Premises:
∀x (Drinks(x) → Dependent(x)) ::: All people who regularly drink coffee are dependent on caffeine.

(... more premises here ...)
∀x (Jokes(x) → ¬Unaware(x)) ::: No one who jokes about being addicted to caffeine is unaware that caffeine is a drug.

Conclusion:
Jokes(rina) ⊕ Unaware(rina) ::: Rina is either a person who jokes about being addicted to caffeine or is unaware that caffeine is a drug.
---------------
Return **only** Predicates, Premises, and Conclusion.
Do not include unnecessary symbols such as "**", "numbered lists (like 1., 2., 3., 4.)", " - " etc."""


    context = item.get('context', '')
    user_prompt = user_prompt.replace('${context}', context)
    
    question = item.get('question', '')
    user_prompt = user_prompt.replace('${question}', question)

    system_prompt = "You are an expert in symbolic logic translation. Follow the instructions carefully and provide accurate translations."
     

    messages = [
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": user_prompt}
        ]

    return llm_helper.chat(messages)


def completion(llm_helper, item):

    user_prompt="""This task is to minimally complete the missing logic information so that the solver can successfully infer the conclusion as TRUE. The current logic formulas is incomplete to support a successful proof (e.g., the solver returns “unknown” or “false”).

Please generate as few additional logic information as possible (at least 1 and at most 4). Each set should contain:
•	one natural language sentence, and
•	its corresponding first-order logic formula.
These should:
1.	Express real-world or commonsense knowledge;
2.	Be semantically relevant to the given context and conclusion, and help connect existing predicates and entities;
3.	Be useful for enabling the solver to infer TRUE and complete the proof.

Input:
1.	Natural language context and conclusion;
2.	Symbolic language context and conclusion;
3.	The solver’s proof based on the current symbolic formulas.

Context:
${context}

Conclusion:
${conclusion}

Symbolic Language Translation:
${translation}

Proof:
${reasoning}

---------------
The grammar of first-order logic is defined as follows:
logical conjunction: expr1 ∧ expr2
logical disjunction: expr1 ∨ expr2
logical exclusive disjunction: expr1 ⊕ expr2
logical negation: ¬expr1
expr1 implies expr2: expr1 → expr2
expr1 if and only if expr2: expr1 ↔ expr2
logical universal quantification: ∀ x
logical existential quantification: ∃ x

---------------
Output format:
logic formula ::: natural language sentence (one set per line)

---------------
Example:
Context: 
All squares are four-sided.

Conclusion:
All squares are shapes.

Symbolic Language Translation:
Predicates:\nSquare(x) ::: x is a square.\nFourSided(x) ::: x is four-sided.\nShape(x) ::: x is a shape.\nPremises:\n∀x (Square(x) → FourSided(x))\nConclusion:\n∀x (Square(x) → Shape(x))

Proof:
trying to prove original conclusion:\n1 (all x (Square(x) -> FourSided(x))) # label(non_clause). [assumption].\n2 (all x (Square(x) -> Shape(x))) # label(non_clause) # label(goal). [goal].\n3 -Square(x) | FourSided(x). [clausify(1)].\n4 Square(c1). [deny(2)].\n5 -Shape(c1). [deny(2)].\n6 Derived: FourSided(c1). [resolve(4,a,3,a)].\n-- Search terminated, no contradiction found --\n\ntrying to prove negation of original conclusion:\n1 (all x (Square(x) -> FourSided(x))) # label(non_clause). [assumption].\n2 -(all x (Square(x) -> Shape(x))) # label(non_clause) # label(goal). [goal].\n3 -Square(x) | FourSided(x). [clausify(1)].\n4 -Square(x) | Shape(x). [deny(2)].\n-- Search terminated, no contradiction found --\n\nSo: Unknown

Example Output:
∀x (FourSided(x) → Shape(x)) ::: All four-sided things are shapes.
---------------

Do not include unnecessary symbols such as "**", "numbered lists (like 1., 2., 3., 4.)", " - " etc."""
    
    context = item.get('context', '').replace('\n\n','\n')
    user_prompt = user_prompt.replace('${context}', context)
    
    question = item.get('question', '')
    user_prompt = user_prompt.replace('${conclusion}', question)

    reasoning = item.get('reasoning', '')
    user_prompt = user_prompt.replace('${reasoning}', reasoning)

    trans = item['translation']['FOL']
    user_prompt = user_prompt.replace('${translation}', trans)

    system_prompt = "You are an expert in symbolic logic reasoning. Follow the instructions carefully and provide accurate symbolic language."

    messages = [
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": user_prompt}
        ]
    return llm_helper.chat(messages)


def comple_k_logic(llm_helper, item):

    user_prompt="""This task is to minimally complete the missing logic information so that the solver can successfully infer the conclusion as TRUE. The current logic formulas is incomplete to support a successful proof (e.g., the solver returns “unknown” or “false”).

Please generate as few additional logic information as possible (at least 1 and at most 4). Each set should contain:
•	one natural language sentence, and
•	its corresponding first-order logic formula.
These should:
1.	Express real-world or commonsense knowledge;
2.	Be semantically relevant to the given context and conclusion, and help connect existing predicates and entities;
3.	Be useful for enabling the solver to infer TRUE and complete the proof.

Input:
1.	Natural language context and conclusion;
2.	Symbolic language context and conclusion;
3.	The solver’s proof based on the current symbolic formulas.

Context:
${context}

Conclusion:
${conclusion}

Symbolic Language Translation:
${translation}

Proof:
${old_reasoning}

Note: Adding the following symbolic formula is known to be unsuccessful. You must output different logical information.
${failed_semantic_logic}${reasoning}

---------------
The grammar of first-order logic is defined as follows:
logical conjunction: expr1 ∧ expr2
logical disjunction: expr1 ∨ expr2
logical exclusive disjunction: expr1 ⊕ expr2
logical negation: ¬expr1
expr1 implies expr2: expr1 → expr2
expr1 if and only if expr2: expr1 ↔ expr2
logical universal quantification: ∀ x
logical existential quantification: ∃ x

---------------
Output format:
logic formula ::: natural language sentence (one set per line)

---------------
Example:
Context: 
Some show airing at 8 pm on Monday gives out roses on TV.\nIf a show gives out roses on TV, then the show is an episode of The Bachelor.\nAll shows portraying the lives of real people are reality TV shows.\nBreaking Bad is a show.\nBreaking Bad is not a reality TV show.

Conclusion:
If roses are given out during Breaking Bad, then it is on Monday at 8 pm.

Symbolic Language Translation:
Predicates:\nShow(x) ::: x is a show.\nAiring(x, day, time) ::: x airs on day at time.\nGivesOutRoses(x) ::: x gives out roses on TV.\nEpisodeOf(x, y) ::: x is an episode of y.\nPortrayingRealLives(x) ::: x portrays the lives of real people.\nRealityTV(x) ::: x is a reality TV show.\nPremises:\n∃x (Show(x) ∧ Airing(x, monday, eightPM) ∧ GivesOutRoses(x)) ::: Some show airing at 8 pm on Monday gives out roses on TV.\n∀x (GivesOutRoses(x) → EpisodeOf(x, theBachelor)) ::: If a show gives out roses on TV, then the show is an episode of The Bachelor.\n∀x (PortrayingRealLives(x) → RealityTV(x)) ::: All shows portraying the lives of real people are reality TV shows.\nShow(breakingBad) ::: Breaking Bad is a show.\n¬RealityTV(breakingBad) ::: Breaking Bad is not a reality TV show.\nConclusion:\nGivesOutRoses(breakingBad) → Airing(breakingBad, monday, eightPM) ::: If roses are given out during Breaking Bad, then it is on Monday at 8 pm.

Proof:
trying to prove original conclusion:\n1 (exists x (Show(x) & Airing(x,Monday,EightPM) & GivesOutRoses(x))) # label(non_clause). [assumption].\n2 (all x (GivesOutRoses(x) -> EpisodeOf(x,TheBachelor))) # label(non_clause). [assumption].\n3 (all x (PortrayingRealLives(x) -> RealityTV(x))) # label(non_clause). [assumption].\n4 GivesOutRoses(BreakingBad) -> Airing(BreakingBad,Monday,EightPM) # label(non_clause) # label(goal). [goal].\n5 Show(c1). [clausify(1)].\n6 Airing(c1,Monday,EightPM). [clausify(1)].\n7 GivesOutRoses(c1). [clausify(1)].\n8 -GivesOutRoses(x) | EpisodeOf(x,TheBachelor). [clausify(2)].\n9 -PortrayingRealLives(x) | RealityTV(x). [clausify(3)].\n10 Show(BreakingBad). [assumption].\n11 -RealityTV(BreakingBad). [assumption].\n12 GivesOutRoses(BreakingBad). [deny(4)].\n13 -Airing(BreakingBad,Monday,EightPM). [deny(4)].\n14 Derived: EpisodeOf(c1,TheBachelor). [resolve(8,a,7,a)].\n15 Derived: EpisodeOf(BreakingBad,TheBachelor). [resolve(12,a,8,a)].\n-- Search terminated, no contradiction found --\n\ntrying to prove negation of original conclusion:\n1 (exists x (Show(x) & Airing(x,Monday,EightPM) & GivesOutRoses(x))) # label(non_clause). [assumption].\n2 (all x (GivesOutRoses(x) -> EpisodeOf(x,TheBachelor))) # label(non_clause). [assumption].\n3 (all x (PortrayingRealLives(x) -> RealityTV(x))) # label(non_clause). [assumption].\n4 -(GivesOutRoses(BreakingBad) -> Airing(BreakingBad,Monday,EightPM)) # label(non_clause) # label(goal). [goal].\n5 Show(c1). [clausify(1)].\n6 Airing(c1,Monday,EightPM). [clausify(1)].\n7 GivesOutRoses(c1). [clausify(1)].\n8 -GivesOutRoses(x) | EpisodeOf(x,TheBachelor). [clausify(2)].\n9 -PortrayingRealLives(x) | RealityTV(x). [clausify(3)].\n10 Show(BreakingBad). [assumption].\n11 -RealityTV(BreakingBad). [assumption].\n12 -GivesOutRoses(BreakingBad) | Airing(BreakingBad,Monday,EightPM). [deny(4)].\n13 Derived: EpisodeOf(c1,TheBachelor). [resolve(8,a,7,a)].\n-- Search terminated, no contradiction found --\n\nSo: Unknown

Note: Adding the following symbolic formula is known to be unsuccessful. You must output different logical information.
∀x (EpisodeOf(x, theBachelor) → PortrayingRealLives(x)) ::: All episodes of The Bachelor portray the lives of real people.
∀x (EpisodeOf(x, theBachelor) → RealityTV(x)) ::: All episodes of The Bachelor are reality TV shows.
∀x (RealityTV(x) → ¬(x = breakingBad)) ∨ ∀x (EpisodeOf(x, theBachelor) → Airing(x, monday, eightPM)) ::: Either no reality TV show is Breaking Bad, or all episodes of The Bachelor air on Monday at 8 pm.
Proof has syntax error

Example Output:
∀x (EpisodeOf(x, theBachelor) → PortrayingRealLives(x)) ::: All episodes of The Bachelor portray the lives of real people.
∀x (EpisodeOf(x, theBachelor) → Airing(x, monday, eightPM)) ::: All episodes of The Bachelor air on Monday at 8 pm.
---------------

Do not include unnecessary symbols such as "**", "numbered lists (like 1., 2., 3., 4.)", " - " etc."""
    
    context = item.get('context', '').replace('\n\n','\n')
    user_prompt = user_prompt.replace('${context}', context)
    
    question = item.get('question', '')
    user_prompt = user_prompt.replace('${conclusion}', question)

    reasoning = item.get('old_reasoning', '')
    if type(reasoning)==str:
        if reasoning=='':
            reasoning='Proof has syntax error'
    elif type(reasoning)==list:
        reasoning=reasoning[0]
        if reasoning=='':
            reasoning='Proof has syntax error'
    user_prompt = user_prompt.replace('${old_reasoning}', reasoning)

    trans = item['translation']['FOL']
    if '::: NEW SL' in trans:
        trans = re.sub(r'^.*::: NEW SL\s*\n?', '', trans, flags=re.MULTILINE)
    user_prompt = user_prompt.replace('${translation}', trans)

    if 'old_missing' in item:
        ok_str=''
        for x in range(len(item['old_missing'])):
            tempp=''.join(item['old_missing'][x])
            reasoning=item['old_reasoning'][x+1]
            if reasoning=='':
                reasoning='Proof has syntax error'
            ok_str=ok_str+tempp+reasoning+'\n\n'
            # print(reasoning)
        tempp=''
        for idx in range(len(item['missing_SL'])):
            tempp=tempp+f"{item['missing_SL'][idx]} ::: {item['missing_NL'][idx]}\n"
        reasoning = item.get('reasoning', '')
        if reasoning=='':
            reasoning='Proof has syntax error'
        ok_str=ok_str+tempp+reasoning
        user_prompt = user_prompt.replace('${failed_semantic_logic}${reasoning}', ok_str)
    else:
        reasoning = item.get('reasoning', '')
        if reasoning=='':
            reasoning='Proof has syntax error'
        user_prompt = user_prompt.replace('${reasoning}', reasoning)
        tempp=''
        for idx in range(len(item['missing_SL'])):
            tempp=tempp+f"{item['missing_SL'][idx]} ::: {item['missing_NL'][idx]}\n"
        user_prompt = user_prompt.replace('${failed_semantic_logic}', tempp)

    system_prompt = "You are an expert in symbolic logic reasoning. Follow the instructions carefully and provide accurate symbolic language."

    messages = [
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": user_prompt}
        ]
    # print(user_prompt)

    return llm_helper.chat(messages)


def reality_veri(llm_helper, item):

    user_prompt="""Your task is to determine whether each of the given sentences describes facts that are likely true in the real world.

A sentence is considered TRUE if:
- It describes a fact, tendency, or relationship that is generally accepted as plausible or commonly observed in the real world.
- It reflects everyday knowledge, typical human experience, or widely held beliefs, even if the statement allows for exceptions or is not precisely verifiable.
- It expresses a reasonable causal, functional, or semantic relationship that aligns with how things usually work in real-world contexts.
- For logical inference statements, the connection between antecedent and consequent should be intuitively grounded in real-world understanding, not purely arbitrary.

A sentence is considered NOT TRUE if:
- It involves clearly fictional, impossible, or nonexistent entities.
- It directly contradicts well-established real-world facts.
- It makes a strong universal claim that is clearly false in general.
- It asserts a specific factual claim that is highly implausible or unsupported by common real-world knowledge.

Input: 
Premises is a list of sentences. Each sentence should be evaluated independently.

Premises:
${premise}

Output Format:
True/False (one premise per line)


Return **only** True/False.
Do not include unnecessary symbols such as "**", "numbered lists (like 1., 2., 3., 4.)", " - " etc."""
    
    context=str(item["missing_NL"])
    user_prompt = user_prompt.replace('${premise}', context)
    system_prompt = "You are an AI specialized in evaluating the real-world truth of symbolic-logic premises. Follow the instructions carefully and provide accurate answer."
    

    messages = [
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": user_prompt}
        ]
    
    # print(user_prompt)

    return llm_helper.chat(messages)


def comple_reality(llm_helper, item):

    user_prompt="""You are a knowledge and logic editor for logic reasoning. 
Please minimal revise the non-factual premises and generate fact premises. each should:
1.	Real-world validity: replace all non-factual sentences (i.e., sentences that are false, unreasonable, violate common sense or natural laws, or involve fictional entities).
2.	Enable the proof to be TRUE.
3.	Be semantically relevant to the given context and conclusion, and help connect existing predicates and entities.
   
    
Input:
1.	Natural language context and conclusion;
2.	Symbolic language context and conclusion;
3.	The solver’s proof based on the current symbolic formulas;
4.	Non-factual premises in natural language and symbolic language.


Context:
${context}

Conclusion:
${conclusion}

Symbolic Language Translation:
${translation}

Proof:
${reasoning}

Non-factual premises:
${sentences}

---------------
The grammar of first-order logic is defined as follows:
logical conjunction: expr1 ∧ expr2
logical disjunction: expr1 ∨ expr2
logical exclusive disjunction: expr1 ⊕ expr2
logical negation: ¬expr1
expr1 implies expr2: expr1 → expr2
expr1 if and only if expr2: expr1 ↔ expr2
logical universal quantification: ∀ x
logical existential quantification: ∃ x

Output only the revised premises.
Output format:
logic formulas ::: natural language sentence (one set per line)

---------------

Example Output:
Dependent(x) ::: x is a person dependent on caffeine
∀x (Drinks(x) → Dependent(x)) ::: All people who regularly drink coffee are dependent on caffeine.

---------------
Do not include unnecessary symbols such as "**", "numbered lists (like 1., 2., 3., 4.)", " - " etc."""



    context = item.get('context', '').replace('\n\n','\n')
    for one_premise in item['missing_NL']:
        context=context+'\n'+one_premise
    user_prompt = user_prompt.replace('${context}', context)
    
    question = item.get('question', '')
    user_prompt = user_prompt.replace('${conclusion}', question)

    reasoning = item.get('reasoning', '')
    user_prompt = user_prompt.replace('${reasoning}', reasoning)

    trans = item['translation']['FOL']
    user_prompt = user_prompt.replace('${translation}', trans)

    sentences=''
    llm_judge_list=item['llm_judge'].split('\n')
    false_indexes = [i for i, v in enumerate(llm_judge_list) if v=="False"]
    for idx in false_indexes:
        sentences=sentences+f"{item['missing_SL'][idx]} ::: {item['missing_NL'][idx]}\n"
    user_prompt = user_prompt.replace('${sentences}', sentences)


    system_prompt = "You are an expert in symbolic logic reasoning. Follow the instructions carefully and provide accurate information"
    

    messages = [
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": user_prompt}
        ]
    
    # print(user_prompt)
    

    return llm_helper.chat(messages)


def comple_k_reality(llm_helper, item):

    user_prompt="""You are a knowledge and logic editor for logic reasoning. 
Please minimal revise the non-factual premises and generate fact premises. each should:
1.	Real-world validity: replace all non-factual sentences (i.e., sentences that are false, unreasonable, violate common sense or natural laws, or involve fictional entities).
2.	Enable the proof to be TRUE.
3.	Be semantically relevant to the given context and conclusion, and help connect existing predicates and entities.


Input:
1.	Natural language context and conclusion;
2.	Symbolic language context and conclusion;
3.	The solver’s proof based on the current symbolic formulas;
4.	Non-factual premises in natural language and symbolic language.


Context:
${context}

Conclusion:
${conclusion}

Symbolic Language Translation:
${translation}

Proof:
${reasoning}

Non-factual premises:
${sentences}


Note, below is not fact, You must output different logical information.: 
${pass} 

---------------
The grammar of first-order logic is defined as follows:
logical conjunction: expr1 ∧ expr2
logical disjunction: expr1 ∨ expr2
logical exclusive disjunction: expr1 ⊕ expr2
logical negation: ¬expr1
expr1 implies expr2: expr1 → expr2
expr1 if and only if expr2: expr1 ↔ expr2
logical universal quantification: ∀ x
logical existential quantification: ∃ x

Output only the revised premises.
Output format:
logic formulas ::: natural language sentence (one set per line)

---------------

Example Output:
Dependent(x) ::: x is a person dependent on caffeine
∀x (Drinks(x) → Dependent(x)) ::: All people who regularly drink coffee are dependent on caffeine.

---------------
Do not include unnecessary symbols such as "**", "numbered lists (like 1., 2., 3., 4.)", " - " etc."""



    context = item.get('context', '').replace('\n\n','\n')
    for one_premise in item['missing_NL']:
        context=context+'\n'+one_premise
    user_prompt = user_prompt.replace('${context}', context)
    
    question = item.get('question', '')
    user_prompt = user_prompt.replace('${conclusion}', question)

    reasoning = item.get('reasoning', '')
    user_prompt = user_prompt.replace('${reasoning}', reasoning)

    trans = item['translation']['FOL']
    user_prompt = user_prompt.replace('${translation}', trans)

    sentences=''
    llm_judge_list=item['llm_judge'].split('\n')
    false_indexes = [i for i, v in enumerate(llm_judge_list) if v=="False"]
    for idx in false_indexes:
        sentences=sentences+f"{item['missing_SL'][idx]} ::: {item['missing_NL'][idx]}\n"
    user_prompt = user_prompt.replace('${sentences}', sentences)

    pas=''
    for ok in item['old_missing_fact']:
        pas=pas+''.join(ok)
    user_prompt = user_prompt.replace('${pass}', pas)

    system_prompt = "You are an expert in symbolic logic reasoning. Follow the instructions carefully and provide accurate information"
    

    messages = [
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": user_prompt}
        ]
    
    # print(user_prompt)
    

    return llm_helper.chat(messages)


def worker_process_item(item, api_key, base_url, model, task_type):
    llm_helper = LLMHelper(api_key=api_key, base_url=base_url, model=model)
    result_item = item.copy()

    try:
        if task_type=='trans':
            gpt_output = translate(llm_helper, item)

            cleaned_output = gpt_output.strip()
            cleaned_output = re.sub(r"\n+", "\n", cleaned_output)
            cleaned_output = re.sub(r"\n-", "\n", cleaned_output).replace("**", "").strip()

            result_item['translation'] = {"FOL": cleaned_output}
            return result_item
        
        elif task_type=='comple':
            gpt_output = completion(llm_helper, item)
            cleaned_output = gpt_output.strip()
            cleaned_output = re.sub(r"\n+", "\n", cleaned_output)
            cleaned_output = re.sub(r"\n-", "\n", cleaned_output).replace("**", "").strip()

            missing_SL, missing_NL=[], []
            all_lines=cleaned_output.split('\n')
            for line in all_lines:
                missing_SL.append(line.split(':::')[0].strip())
                missing_NL.append(line.split(':::')[-1].strip())

            result_item['missing_SL'] = missing_SL
            result_item['missing_NL'] = missing_NL
            result_item['old_reasoning']=result_item['reasoning']

            del result_item['final_answer']; del result_item['gold_answer']; del result_item['solver_status']; 
            del result_item['solver_error']; del result_item['reasoning']; 
            return result_item
        
        elif task_type=='comple_k_logic':
            gpt_output = comple_k_logic(llm_helper, item)
            cleaned_output = gpt_output.strip()
            cleaned_output = re.sub(r"\n+", "\n", cleaned_output)
            cleaned_output = re.sub(r"\n-", "\n", cleaned_output).replace("**", "").strip()
            # print(cleaned_output)

            missing_SL, missing_NL=[], []
            all_lines=cleaned_output.split('\n')
            for line in all_lines:
                missing_SL.append(line.split(':::')[0].strip())
                missing_NL.append(line.split(':::')[-1].strip())

            tempp=''
            for idx in range(len(result_item['missing_SL'])):
                tempp=tempp+f"{result_item['missing_SL'][idx]} ::: {result_item['missing_NL'][idx]}\n"

            if 'old_missing' in result_item:
                tempp=[tempp]
                result_item['old_missing'].append(tempp)
            else:
                result_item['old_missing'] = [[tempp]]

            if type(result_item['old_reasoning'])==str:
                result_item['old_reasoning']=[result_item['old_reasoning']]
            result_item['old_reasoning'].append(result_item['reasoning'])

            result_item['missing_SL'] = missing_SL
            result_item['missing_NL'] = missing_NL

            del result_item['final_answer']; del result_item['gold_answer']; del result_item['solver_status']; 
            del result_item['solver_error']; del result_item['reasoning']; 
            return result_item
        
        elif task_type=='reality_veri':
            gpt_output = reality_veri(llm_helper, item)
            cleaned_output = gpt_output.strip()
            cleaned_output = re.sub(r"\n+", "\n", cleaned_output)
            cleaned_output = re.sub(r"\n-", "\n", cleaned_output).replace("**", "").strip()

            result_item['llm_judge'] = cleaned_output
            return result_item
        
        elif task_type=='comple_reality':
            gpt_output = comple_reality(llm_helper, item)
            cleaned_output = gpt_output.strip()
            cleaned_output = re.sub(r"\n+", "\n", cleaned_output)
            cleaned_output = re.sub(r"\n-", "\n", cleaned_output).replace("**", "").strip()

            missing_SL, missing_NL=[], []
            all_lines=cleaned_output.split('\n')
            for line in all_lines:
                missing_SL.append(line.split(':::')[0].strip())
                missing_NL.append(line.split(':::')[-1].strip())

            result_item['missing_SL'] = missing_SL
            result_item['missing_NL'] = missing_NL
            if 'solver_pass_num' not in result_item:
                result_item['solver_pass_num']=0

            tempp=''
            for idx in range(len(result_item['missing_SL'])):
                tempp=tempp+f"{result_item['missing_SL'][idx]} ::: {result_item['missing_NL'][idx]}\n"

            if 'old_missing_fact' in result_item:
                tempp=[tempp]
                result_item['old_missing_fact'].append(tempp)
            else:
                result_item['old_missing_fact'] = [[tempp]]

            return result_item
        
        elif task_type=='comple_k_reality':
            gpt_output = comple_k_reality(llm_helper, item)
            cleaned_output = gpt_output.strip()
            cleaned_output = re.sub(r"\n+", "\n", cleaned_output)
            cleaned_output = re.sub(r"\n-", "\n", cleaned_output).replace("**", "").strip()

            missing_SL, missing_NL=[], []
            all_lines=cleaned_output.split('\n')
            for line in all_lines:
                missing_SL.append(line.split(':::')[0].strip())
                missing_NL.append(line.split(':::')[-1].strip())

            tempp=''
            for idx in range(len(result_item['missing_SL'])):
                tempp=tempp+f"{result_item['missing_SL'][idx]} ::: {result_item['missing_NL'][idx]}\n"
            result_item['old_missing_fact'].append([tempp])

            result_item['missing_SL'] = missing_SL
            result_item['missing_NL'] = missing_NL
            

            return result_item

    except Exception as e:
        result_item["api_error"] = f"ExceptionError: {e}"
        return result_item



# ========== 主逻辑 ==========

def main():
    parser = argparse.ArgumentParser(description='call api')
    parser.add_argument('--input_file', type=str, default='', help='Input JSON file path')
    parser.add_argument('--output_file', type=str, default='', help='Output JSON file path')

    parser.add_argument('--openai_api_key', type=str, default='', help='OpenAI API key')
    parser.add_argument('--openai_base_url', type=str, default='', help='OpenAI API base URL')
    parser.add_argument('--model', type=str, default='', help='Model name')
    parser.add_argument('--num_workers', type=int, default=51, help='')
    parser.add_argument('--task_type', type=str, choices=['trans', 'comple', 'comple_k_logic', 'reality_veri', 'comple_k_reality', 'comple_reality'], default='', help='')

    args = parser.parse_args()
    task_type=args.task_type
    flst=True

    data = load_data(args.input_file)
    results = []

    while flst:
        if os.path.exists(args.output_file):
            yaode_data, exist_id, xin_result=[],[],[]
            results=load_data(args.output_file)
            for item in results:
                cu_id=item['id']
                if 'maskid' in results[0]:
                    cu_id=item['id']+str(item['maskid'])
                if 'api_error' in item:
                    continue
                else:
                    exist_id.append(cu_id)
                    xin_result.append(item)
            for item in data:
                cu_id=item['id']
                if 'maskid' in results[0]:
                    cu_id=item['id']+str(item['maskid'])
                if cu_id not in exist_id:
                    yaode_data.append(item)
            results=xin_result
            data=yaode_data
            print(len(results))

        with ProcessPoolExecutor(max_workers=args.num_workers) as executor:
            futures = [executor.submit(worker_process_item, item, args.openai_api_key, args.openai_base_url, args.model, task_type) for item in data]
            for fut in tqdm(as_completed(futures), total=len(futures), desc="Calling LLM (multiprocess)"):
                result_item = fut.result()
                results.append(result_item)
                save_data(args.output_file, results)

        print(f"\nFinal save to {args.output_file}...")
        save_data(args.output_file, results)
        flst=False
        for checkk in results:
            if 'api_error' in checkk:
                flst=True
                break
            



    if task_type=='comple' or task_type=='comple_k_logic' or task_type=='comple_logic' or task_type=='comple_k_reality' or task_type=='comple_reality':
        new_data=[]
        for item in results:
            tempp=''
            for one_SL in item['missing_SL']:
                tempp=tempp+f"{one_SL} ::: NEW SL\n"
            if '::: NEW SL' in item['translation']['FOL']:
                result = re.sub(r'^.*::: NEW SL\s*\n?', '', item['translation']['FOL'], flags=re.MULTILINE)
                item['translation']['FOL']=result.replace('\nPremises:\n',f'\nPremises:\n{tempp}')
            else:
                item['translation']['FOL']=item['translation']['FOL'].replace('\nPremises:',f'\nPremises:\n{tempp}')
                item['translation']['FOL']=item['translation']['FOL'].replace('\n\n','\n')
            new_data.append(item)
        save_data(args.output_file.replace('.json','_fmt.json'), new_data)

    elif task_type=='reality_veri':
        get_not_fact(args.output_file)


    elif task_type=='trans':
        new_data=[]
        for item in results:
            item['translation']['FOL']=item['translation']['FOL'].replace('  \n','\n')
            item['translation']['FOL']=item['translation']['FOL'].replace('Conclusion\n','Conclusion:\n')
            item['translation']['FOL']=item['translation']['FOL'].replace('Predicates\n','Predicates:\n')
            item['translation']['FOL']=item['translation']['FOL'].replace('Premises\n','Premises:\n')
            if 'Premises' not in  item['translation']['FOL']:
                item['translation']['FOL']='\nPremises:\n'+item['translation']['FOL']
            if 'Conclusion:' not in  item['translation']['FOL']:
                pats='\n'.join(item['translation']['FOL'].split('\n')[:-1])
                con='\nConclusion:\n'+item['translation']['FOL'].split('\n')[-1]
                item['translation']['FOL']=pats+con
            new_data.append(item)
        save_data(args.output_file, new_data)





if __name__ == '__main__':
    main()