# Default configuration for MARA evaluation

# Required parameters
# Output CSV file name (relative path).
output_csv: 'results.csv'

# Data directory (relative path); the default points at an example benchmark.
data_dir: './python_examples/autumnbench/example_benchmark'

# Model configuration
# LLM provider name and the model identifier to use with that provider.
llm_provider: 'openrouter'
model: 'google/gemini-flash-1.5'

# Agent configuration
# Keep exactly one `agent` line active (duplicate keys are invalid YAML);
# uncomment one of the alternatives below to switch agents.
agent: 'autumn_llm_unified_interactive_agent_v1'  # LLM-based agent
# agent: 'autumn_random_interactive_agent_v1'  # Random agent
# agent: 'autumn_simple_wm_agent'  # Oracle autumnSynth agent

# Agent options.
# NOTE(review): presumably only consulted by the LLM-based agent - confirm.
use_scratchpad: true
instruction_type: 'reflection'
hint: true

# NOTE(review): presumably only relevant to the oracle agent; null leaves it
# unset - confirm against the agent code.
oracle_seed: null

# Log location (relative path).
logging_path: './logs'

# History, frame handling, step limits, rendering and seeding.
# NOTE(review): -1 presumably means "no limit" on history length - confirm.
max_history_length: -1
stack_frames: true
skip_frames: false
max_interaction_steps: 300
max_steps: 501
render_mode: 'text'
seed: 0

# Selected task. Options listed for this key: mfp, cd, planning.
task_name: 'cd'

# Environment names, one list entry per line.
envs:
  - 'ice'

# Experiment name; interpolated into the Hydra run directory below.
exp_name: 'full_evaluation'

hydra:
  job:
    # Switch the process working directory to the run directory.
    # NOTE(review): with this enabled, the relative paths elsewhere in this
    # file (e.g. data_dir) presumably resolve against the run directory unless
    # the code converts them to absolute paths - confirm.
    chdir: true
  run:
    # One directory per run: ./experiments/<exp_name>/<YYYY-MM-DD>/<HH-MM-SS>.
    dir: './experiments/${exp_name}/${now:%Y-%m-%d}/${now:%H-%M-%S}'
