import csv
import json
import jsonlines

def question_read(text_file):
    """Return the first field of every row in a comma-separated file.

    Args:
        text_file: Path of the CSV file to read.

    Returns:
        A list with one string per non-blank row: that row's first field.
        An empty file yields an empty list.
    """
    # The context manager closes the file even if parsing raises.
    # newline="" hands raw line endings to the csv module, as its
    # documentation requires, so quoted fields with embedded newlines
    # are parsed correctly.
    with open(text_file, "r", newline="") as file:
        # csv.reader yields an empty list for a blank line; skip those rows
        # instead of failing with IndexError on row[0].
        return [row[0] for row in csv.reader(file, delimiter=",") if row]


# Load the JSON Lines dataset: each line of the file holds one JSON object.
# Decode explicitly as UTF-8 (the encoding JSON text is exchanged in) rather
# than relying on the platform's default encoding.
with open("../ft_datasets/pure_bad_dataset/mixed_10_prefixed.jsonl", "r", encoding="utf-8") as f:
    lines = f.readlines()

# Skip whitespace-only lines (e.g. a trailing blank line), which json.loads
# would otherwise reject with a JSONDecodeError.
data = [json.loads(line) for line in lines if line.strip()]

# Sanity output: the number of records, then the first record.
print(len(data))

print(data[0])
# for i in range(len(data)):
#     if i<100:
#         data[i]["prefixed"]=0
#     else:
#         data[i]["prefixed"]=1

# print(data[99])

# with jsonlines.open("../ft_datasets/pure_bad_dataset/mixed_10_prefixed.jsonl","w") as f:
#     for i in data:
#         f.write(i)


# Export the content of the first message of each of the first 100 records
# to training.csv, one single-column row per record.
# newline="" is required when handing a file to csv.writer: without it, on
# platforms that translate "\n" to "\r\n" every row ends in "\r\r\n" and the
# file appears to contain a blank line after each row.
with open("training.csv", "w", newline="") as csvfile:
    writer = csv.writer(csvfile)
    writer.writerows(
        [record["messages"][0]["content"]] for record in data[:100]
    )