; Identifies what this configuration targets: a package name, an environment
; name, and an RNN name.
; NOTE(review): how these strings are resolved (module lookup, class lookup,
; case sensitivity) depends on the loader, which is not visible here — confirm.
[base]
package = atari
env_name = pong
; Capitalised, unlike the other values in this section; presumably matched
; against a class or symbol name — verify before changing the case.
rnn_name = Recurrent

; Training hyperparameters.
; NOTE(review): the key names (gae_lambda, clip_coef, vf_coef, ent_coef, ...)
; look like PPO-style settings — confirm against the trainer that reads them.
[train]
; Five million, written with underscore digit separators. Assumes the loader
; accepts underscores in integer values — TODO confirm before porting this
; file to another parser.
total_timesteps = 5_000_000
; batch_size / minibatch_size = 32768 / 1024 = 32.
batch_size = 32768
minibatch_size = 1024
update_epochs = 2
; NOTE(review): presumably the sequence length used for the recurrent model
; named in [base] — verify against the trainer.
bptt_horizon = 8
; The full-precision decimals below look machine-generated (for example the
; output of a hyperparameter search) rather than hand-picked — presumably they
; should be kept verbatim; confirm before rounding.
learning_rate = 0.0006112614226003401
gae_lambda = 0.9590507508564148
gamma = 0.9671759718055382
ent_coef = 0.01557519441744131
clip_coef = 0.3031963355045393
vf_clip_coef = 0.13369578727174328
vf_coef = 0.9274225135298954
max_grad_norm = 1.392141580581665

; Environment options.
; NOTE(review): these key names match common Atari emulator options — confirm
; how the environment constructor consumes them.
[env]
frameskip = 4
; Set to 0.0; presumably this disables random action repetition ("sticky
; actions") — verify against the environment implementation.
repeat_action_probability = 0.0
