---
# Dataset configuration: a data file, the split to use, the names of the
# fields to read, and a companion scores file.
# NOTE(review): the per-key notes below are inferred from key names and file
# extensions only; confirm against the code that consumes this config.

# Dataset identifier; here it is an absolute path to a .jsonl file.
name: /mnt/data/data-selection/data/processed/cohere/cohere_data.jsonl
split: train

# Field names, presumably looked up in each record (TODO confirm):
# label, payload, and unique index respectively.
label_column: dataset
data_column: messages
idx_column: id

# Absolute path to a .jsonl scores file. The file name suggests the scores
# are normalized; verify with whatever produces it.
scores_path: /mnt/data/data-selection/data/processed/cohere/norm_scores.jsonl