# Experiment run configuration: the models to query, generation/runtime
# settings, and the evaluators to apply.

# Experiment name. NOTE(review): contains a slash, so it presumably doubles
# as an output sub-path -- confirm against the code that consumes it.
exp_name: level/short
# Explicit null (no value set). Presumably means "no filter / use all";
# verify how the loader treats a null here.
task_names: null
prompt_idxs: null

# Model identifiers, in the order listed.
models:
  - llama3.2-90b-vision
  - mistral-large-2407
# NOTE(review): presumably an index into `models` to resume from -- confirm.
resume_model: 0
# Explicit null (no value set). Presumably the system prompt -- confirm.
system: null
max_tokens: 8192
seed: 12
num_workers: 20

# Evaluator names. NOTE(review): the semantics of each evaluator are defined
# by the consuming code, not by this file.
evaluators:
  - final_match
  - order_consistency
  - order_consistency_loose
  - order_consistency_list
  - order_consistency_first
  - order_invariant
  - order_invariant_loose