import os
import json

# Script: pick, from the full split file, the records whose 'id' appears in
# the '42_dev.jsonl' generation file, and append them (one JSON object per
# line) to '42_test.jsonl' in the same directory.

task = 'LaMP_2'
split = 'dev'


def _read_jsonl(path):
    """Yield one decoded JSON object per non-blank line of *path*.

    Blank lines (e.g. a trailing newline at end of file) are skipped rather
    than being passed to ``json.loads``, which would raise on them.
    """
    with open(path, 'r', encoding='utf-8') as f:
        for line in f:
            if line.strip():
                yield json.loads(line)


# Index every record of the split file by its 'id'. If an id occurs more than
# once, the last record read wins.
data_path = "data/LaMP/{}/{}/{}_new_test.json".format(task, split, split)
source_list = []
target_list = []
user_list = {}
for data in _read_jsonl(data_path):
    user_list[data['id']] = data

# Collect the distinct ids of the generation file in first-seen order.
# dict.fromkeys de-duplicates in O(n) while preserving insertion order,
# replacing a linear list scan per line.
data_path = 'data/{}/generation/openai/42_dev.jsonl'.format(task)
id_list = list(dict.fromkeys(data['id'] for data in _read_jsonl(data_path)))
print(len(id_list))
# Pause until the user presses Enter, so the count can be inspected before
# anything is written.
input()

# Raises KeyError if the generation file references an id that is absent from
# the split file.
new_data_list = [user_list[user_id] for user_id in id_list]

output_path = 'data/{}/generation/openai/42_test.jsonl'.format(task)
# NOTE(review): the file is opened in append mode, so running the script twice
# writes every record twice. Switch to 'w' if a fresh file is intended.
with open(output_path, 'a', encoding='utf-8') as f:
    for data in new_data_list:
        json.dump(data, f)
        f.write('\n')