# env1: `navigation` environment entry that selects the `base` eval set.
# NOTE(review): apart from `eval_set`, every value here matches `env2`;
# presumably the two entries are meant to stay in sync — confirm.
env1:
    env_name: navigation
    # Environment-specific options; their exact meaning is defined by the
    # code that consumes this file (not visible here).
    env_config:
        render_mode: vision
        prompt_format: no_think
        use_state_reward: false
        eval_set: base
    # Presumably the number of train / test samples to use — TODO confirm
    # against the loader.
    train_size: 10000
    test_size: 64

# env2: `navigation` environment entry that selects the `common_sense`
# eval set.
# NOTE(review): apart from `eval_set`, every value here matches `env1`;
# presumably the two entries are meant to stay in sync — confirm.
env2:
    env_name: navigation
    # Environment-specific options; their exact meaning is defined by the
    # code that consumes this file (not visible here).
    env_config:
        render_mode: vision
        prompt_format: no_think
        use_state_reward: false
        eval_set: common_sense
    # Presumably the number of train / test samples to use — TODO confirm
    # against the loader.
    train_size: 10000
    test_size: 64