# Run-level settings for this evaluation config.
# NOTE(review): the exact meaning of each key is defined by the consuming
# script, which is not visible from this file — confirm there before changing.
verbose: 0
debug: false
# Alternative output location, currently disabled:
# logdir: data/ablation/dpo_vs_sft/alfworld/eval_in_dist
logdir: 'data/eval/alfworld/dpo_ablation'
exact_path: false
num_processes: 1
start_env_idx: 0
# Explicit null; presumably means "no upper limit" — TODO confirm in the loader.
max_env_idxs: null
eval_set: 'eval_out_of_distribution'
# Agents to run. Every entry in this file carries `type`, `model_id` and
# `prompt_template_file`; the `type` values that appear here are hf, openai,
# hf_space (adds `space_id`) and sglang_server (adds `server_url`).
# In the lines below only one entry is active; the commented-out entries are
# kept as ready-made alternatives to switch in.
agents:
  # - type: hf
  #   model_id: meta-llama/Meta-Llama-3.1-8B-Instruct
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: anonymous/Meta-Llama-3-8B-Instruct-sft-alfworld-v1
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: meta-llama/Meta-Llama-3-8B-Instruct
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: anonymous/Meta-Llama-3-8B-Instruct-sft-alfworld-iter0
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: openai
  #   model_id: gpt-4o-mini
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: anonymous/Meta-Llama-3-8B-Instruct-sft-alfworld-iter1
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: anonymous/Meta-Llama-3-8B-Instruct-sft-alfworld-iter1-50-50
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: anonymous/Meta-Llama-3-8B-Instruct-sft-alfworld-iter2
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: anonymous/Meta-Llama-3-8B-Instruct-sft-alfworld-v1
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: google/gemma-2-9b-it
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: meta-llama/Meta-Llama-3-8B-Instruct
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: mistralai/Codestral-22B-v0.1
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: google/gemma-2-27b-it
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: meta-llama/Meta-Llama-3-70B-Instruct
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: mistralai/Codestral-22B-v0.1
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: anonymous/Meta-Llama-3-8B-Instruct-dpo-lr1e-7-bt0.1-ep0.01-alfworld-iter1
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: openai
  #   model_id: gpt-4o
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: openai
  #   model_id: gpt-4o-mini
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: meta-llama/Meta-Llama-3-8B-Instruct
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: anonymous/Meta-Llama-3-8B-Instruct-sft-alfworld-iter0
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: anonymous/Meta-Llama-3-8B-Instruct-sft-alfworld-iter1
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: save/2409/alfworld_sft_ablation/correction_25/iter1/checkpoint-1055/
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: save/2409/alfworld_sft_ablation/correction_75/iter1/checkpoint-1053/
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: save/2409/alfworld_sft_ablation/correction_0/iter1/checkpoint-800/
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: save/2408/alfworld_sft/iter2/checkpoint-553/
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: save/240907/alfworld_sft_self_correct/iter1/checkpoint-415/
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf
  #   model_id: save/240907/alfworld_sft_self_correct/iter1/checkpoint-415/
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: openai
  #   model_id: gpt-4o-mini
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: hf_space
  #   model_id: meta-llama/Meta-Llama-3-8B-Instruct
  #   space_id: anonymous/anonymous
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # - type: sglang_server
  #   model_id: meta-llama/Meta-Llama-3-8B-Instruct
  #   server_url: http://localhost:30000/
  #   prompt_template_file: prompts/alfworld/alfworld_template.j2

  # Active entry.
  - type: 'hf'
    model_id: 'save/240826/alfworld_dpo_lr5e-7_bt0.1_ep1/iter1/checkpoint-907/'
    prompt_template_file: 'prompts/alfworld/alfworld_template.j2'