from typing import List

import os
import openai

class BaseLLM:
    def __init__(self, template='{}'):
        api_key = os.getenv("OPENAI_API_KEY", "")
        base_url = os.getenv("OPENAI_BASE_URL", "")

        self.client = openai.OpenAI(api_key=api_key, base_url=base_url)

        # Template should contain exactly one {} for correct formatting.
        self.template = template
        assert template.count("{}") == 1

    # @backoff.on_exception(backoff.expo, openai.APIError)
    def completions_with_backoff(self, model: str, **kwargs):
        return self.client.chat.completions.create(model=model, **kwargs)
    
    def llm_inference(self, prompt: str) -> str:
        messages = [{"role": "user", "content": prompt}]
        res = self.completions_with_backoff(
                    model='deepseek-chat',
                    messages=messages,
                    temperature=0.7,
                    max_tokens=8192,
                    n=1,
                    stop=[],
                    top_p=0.95,
                    timeout=300
                )
        
        return res.choices[0].message.content
        

    def generate_response(self, prompt: str) -> str:
        """
        Generates a response to a given prompt.
        """

        response = self.llm_inference(self.template.format(prompt))

        return response


if __name__ == "__main__":
    template = 'Rewrite the following proposition as a single sentence stating one claim, preserving essential content. Exclude intermediate computations—state only the final result.\n\n{}\n\nRespond with the claim only—no preface, labels, quotes, or commentary.'
    prop = 'Total number of ways to pair 12 distinct letters into 6 unordered pairs: Ω = 12!/(6! × 2^6) = 479001600/(720 × 64) = 479001600/46080 = 10395'

    prop_converter = BaseLLM(template)

    response = prop_converter.generate_response(prop)
    print(response)

