# Experiment label.
exp_name: main
# Left unset: an empty value parses as null, written explicitly here.
# NOTE(review): confirm the consumer treats null as "no task filter".
task_names: null
# Every fifth index from 0 through 235 inclusive (48 entries).
prompt_idxs:
  [
    0, 5, 10, 15, 20, 25, 30, 35, 40, 45, 50, 55,
    60, 65, 70, 75, 80, 85, 90, 95, 100, 105, 110, 115,
    120, 125, 130, 135, 140, 145, 150, 155, 160, 165, 170, 175,
    180, 185, 190, 195, 200, 205, 210, 215, 220, 225, 230, 235
  ]


# Model identifiers for this run (a single entry).
models:
  - o1-mini-2024-09-12
# NOTE(review): presumably an index into `models` to resume from — confirm
# against the code that reads this file.
resume_model: 0
# Left unset: an empty value parses as null, written explicitly here.
# NOTE(review): presumably the system prompt — confirm.
system: null
max_tokens: 65536
seed: 12
num_workers: 100

# Evaluator names, in the order listed in the original configuration.
evaluators:
  - final_match
  - order_consistency
  - order_consistency_loose
  - order_consistency_list
  - order_consistency_first
  - order_invariant
  - order_invariant_loose