import os
import sys

# Put the parent of this script's directory on the import path so the
# package import below resolves when the script is run directly, and echo
# the resolved directory so the path in use is visible in the output.
_PARENT_DIR = os.path.abspath(
    os.path.join(os.path.dirname(__file__), os.pardir)
)
sys.path.append(_PARENT_DIR)
print(_PARENT_DIR)

from A_data_preprocess.util.data import create_few_shots

# Path handed to create_few_shots as `file_path`. Supply it as the first
# command-line argument; the literal below is only the fallback used when the
# script is started without arguments, so existing invocations keep working.
DEFAULT_FILE_PATH = "/data/home10b/wlj/code/ICLR2025/data"
file_path = sys.argv[1] if len(sys.argv) > 1 else DEFAULT_FILE_PATH

# Active runs, one entry per dataset: (dataset_name, n_clusters, seeds).
# Every run uses src_l=["en"], k=4, set_up='cluster_in_cross', mode='train'.
# The seed order is kept exactly as originally written for each dataset.
#
# Disabled alternative configurations, kept for reference (all with k=4 and
# the same n_clusters as the active run of the same dataset):
#   * set_up='random', mode='test', seeds=[32, 100, 44], src_l=["en"]
#     (xcopa variant used src_l=["en", "zh", "it"])
#   * set_up='sim_in_cross', mode='test', seeds=[32], src_l=["en"]
#   * xcopa only: set_up='cluster_in_cross', mode='train',
#     seeds=[32, 100, 44], src_l=["zh", "it"]
FEW_SHOT_RUNS = [
    ('tydiqa', 20, [32, 44, 100]),
    ('xcopa', 5, [32, 100, 44]),
    ('xnli', 20, [32, 100, 44]),
]

for dataset_name, n_clusters, seeds in FEW_SHOT_RUNS:
    # A fresh src_l list is built for every call so that no list object is
    # shared between invocations.
    create_few_shots(
        dataset_name=dataset_name,
        file_path=file_path,
        src_l=["en"],
        k=4,
        n_clusters=n_clusters,
        seeds=seeds,
        set_up='cluster_in_cross',
        mode='train',
    )