completion_tokens = prompt_tokens = 0
call_count = 0

old_usage = []

def completions_with_backoff(client, **kwargs):
    return client.chat.completions.create(**kwargs)

def gpt(prompt, model="gpt-4", temperature=0.7, max_tokens=1000, n=1, stop=None, client=None, **kwargs) -> list:
    if isinstance(prompt, str):
        messages = [{"role": "user", "content": prompt}]
    else:
        messages = prompt
    return chatgpt(messages, model=model, temperature=temperature, max_tokens=max_tokens, n=n, stop=stop, client=client, **kwargs)

def chatgpt(messages, model="gpt-4", temperature=0.7, max_tokens=1000, n=1, stop=None, client=None, **kwargs) -> list:
    global completion_tokens, prompt_tokens, call_count
    outputs = []
    call_count += n
    while n > 0:
        cnt = min(n, 20)
        n -= cnt
        res = completions_with_backoff(client, model=model, messages=messages, temperature=temperature, max_tokens=max_tokens, n=cnt, stop=stop, extra_body=kwargs)
        outputs.extend([choice.message.content for choice in res.choices])
        # log completion tokens
        completion_tokens += res.usage.completion_tokens
        prompt_tokens += res.usage.prompt_tokens
    return outputs

def gpt_usage():
    global completion_tokens, prompt_tokens, call_count
    return completion_tokens, prompt_tokens, call_count

def reset_usage():
    global completion_tokens, prompt_tokens, call_count, old_usage
    old_usage.append((prompt_tokens, completion_tokens, call_count))
    completion_tokens = 0
    prompt_tokens = 0
    call_count = 0