# Hydra defaults list: picks the `sac` option for the `agent` entry.
defaults:
  - agent: sac

# Environment name; also interpolated into hydra.name and the run directory.
env: cheetah_run

# Experiment tag; this needs to be specified manually.
exp: delta
# `experiment` resolves to the value of `exp` and ends the run directory name.
# Other tags previously noted on this line: w_model_loss, no_model_update,
# delta_sac, velocity_investigation, fixed_mlp, mlp_delta, mlp_debug,
# delta_sac, pos_only, test_exp
experiment: ${exp}

# Number of training steps, written as a plain integer. The previous spelling
# `2e6` has no decimal point, so YAML 1.1 loaders (e.g. PyYAML) read it as the
# string "2e6", and loaders that do accept it produce a float, not an integer.
num_train_steps: 2000000
# Replay buffer capacity tracks num_train_steps through interpolation.
replay_buffer_capacity: ${num_train_steps}


# NOTE(review): presumably the number of initial steps collected before agent
# updates begin — confirm against the training loop.
num_seed_steps: 5000

# evaluation schedule: how often to evaluate and how many episodes per round
eval_frequency: 10000
num_eval_episodes: 10

# compute device
device: cuda

# NOTE(review): presumably the number of stacked inputs and the latent size —
# confirm against the code that reads these keys.
stack_num: 3
latent_dim: 25


# logger
log_frequency: 10000
# TensorBoard output is disabled.
log_save_tb: false

# video recorder
save_video: false

# Seed value; also interpolated into the Hydra run directory name.
seed: 2000


# hydra configuration
# hydra.name follows the environment name. Each run writes to
# ./exp/<date>/<HHMM>_<env>_<seed>_<experiment>.
hydra:
  name: ${env}
  run:
    dir: ./exp/${now:%Y.%m.%d}/${now:%H%M}_${env}_${seed}_${experiment}
    # dir: ./exp/${now:%Y.%m.%d}/${now:%H%M}_${agent.name}_${experiment}

# only for noisy norm; uncomment when launching noisy norm experiments
#vel_idx: 3  # 8 for cheetah_run; 15 for walker_run; 3 for cartpole

# only for shared_encoder
encoding_dim: 30
encoder_hidden: 128
encoder_layer: 3
model_update_frequency: 5
# NOTE(review): presumably a 0/1 switch for reward prediction — confirm against
# the code that reads it.
predict_reward: 1

# rnn dynamics
# NOTE(review): presumably the recurrent hidden size, the training sequence
# length, and the batch size — confirm against the dynamics model code.
hidden_dim: 50
train_length: 8
batch: 64