experiment:
    project: "alfworld_eval"
    # Number of machines (nodes) you have.
    num_node: 1
    # No need to change.
    node_index: 0


# These settings only need to be filled in when running on multiple nodes.
# Each value is left as an explicit null until you set it.
system:
    HTTP_PROXY: null  # your proxy
    HF_HOME: null  # your HF_HOME directory
    env_name: null  # name of the environment
    envs_dir: null  # directory of the environments
    rl_base_dir: null  # your base directory

model: null  # path to the model; must be set before running

dataset:
    environment_type: "alfworld"
    # One of: "train", "eval_in_distribution", "eval_out_of_distribution".
    alfworld_data_type: "eval_in_distribution"
    # Placeholder: replace with the absolute path to your alfworld_master directory.
    environment_file_dir: "/absolute/path/to/alfworld_master"
    # Placeholder: replace with the directory where you downloaded the alfworld-data.
    environment_data_dir: "/path/to/alfworld_data"


# Rollout / generation settings.
# NOTE(review): the meaning of each key is inferred from its name only;
# confirm against the code that consumes this file before relying on it.
rollout:
    env_max_parallel: 256
    num_rollout_per_trial: 4
    max_interaction_step: 60
    temperature: 0.6
    model_length: 20000
    max_gen_length: 2000
    # Two groups of four indices each (presumably GPU device ids — confirm).
    gpu_groups:
        - [0, 1, 2, 3]
        - [4, 5, 6, 7]
    if_start_with_think: false
    



