import requests
from datasets import Dataset

# Build small train/val/test splits from a remote JSON dataset and save
# them to disk under "fv0/".

# URL of the JSON file
url = "https://raw.githubusercontent.com/ericwtodd/function_vectors/main/dataset_files/extractive/adjective_v_verb_3.json"

# Seconds to wait for the server (connect / between bytes) before giving up.
# Without a timeout, requests.get() can block indefinitely on a stalled
# connection.
REQUEST_TIMEOUT = 30

# Download the JSON data
response = requests.get(url, timeout=REQUEST_TIMEOUT)
# Fail loudly on a 4xx/5xx response instead of trying to parse an error
# page as if it were the dataset.
response.raise_for_status()
data = response.json()

# Add prompt column to each item (every item must provide an "input" key)
for item in data:
    item["prompt"] = f"Here is a list of 3 words. Choose one of them. Answer in one word.\n{item['input']}"

# Splits are contiguous slices taken in file order (no shuffling):
# NUM_TRAIN items for train, then 100 for val, then 100 for test.
# NOTE: slicing does not raise when fewer than NUM_TRAIN + 200 items are
# available; the later splits would simply come out shorter or empty.
NUM_TRAIN = 1
train = data[:NUM_TRAIN]
val = data[NUM_TRAIN:NUM_TRAIN + 100]
test = data[NUM_TRAIN + 100:NUM_TRAIN + 200]

# Convert to Datasets dataset and save to disk
Dataset.from_list(train).save_to_disk("fv0/train")
Dataset.from_list(val).save_to_disk("fv0/val")
Dataset.from_list(test).save_to_disk("fv0/test")
