from datasets import load_dataset, Dataset
from ast import literal_eval
from transformers import AutoTokenizer



livebench = load_dataset("livebench/coding")

def proccess_tests(row):
    row['public_test_cases'] = literal_eval(row['public_test_cases'])
    return row
    
livebench = livebench.map(proccess_tests)

tokenizer = AutoTokenizer.from_pretrained("Qwen/Qwen2.5-Coder-7B-Instruct")

def add_prompt(row):
    
    prompt =  "Solve the following problem:\n\n" + row['original_json']['question_content']
    starter_code = row.get('original_json', {}).get('starter_code', '')
    
    if starter_code != '':
        prompt += "\n\nFormat:You will use the following starter code to write the solution to the problem and enclose your code within delimiters\n```python\n" + starter_code + "\n```"
   
    messages = [
    {"role": "system", "content": "You are a coding assistant.  Your task is to output ONLY valid code for the given task.  Do not include explanations, comments, markdown formatting (```), or natural language.  Output exactly and only the code required. Use input() to input and print() to output."},
    {"role": "user", "content": prompt}
        ]
    text = tokenizer.apply_chat_template(
        messages,
        tokenize=False,
        add_generation_prompt=True
    )
    
    row['prompt'] = text
    return row

livebench = livebench.map(add_prompt)
livebench = livebench.filter(lambda x: len(tokenizer.tokenize(x['prompt'])) < 512)


livebench.save_to_disk('datasets/livebench')

