; Run selection: both keys below carry the same identifier, pokemon_red.
; NOTE(review): presumably `package` names the environment package and
; `env_name` the environment inside it -- confirm against the config loader.
[base]
package = pokemon_red
env_name = pokemon_red

; Training settings for the run selected in [base].
; Values are spelled as Python-style literals (True/False, 1_000_000, 2.0e-4).
; NOTE(review): presumably the loader evaluates them as Python literals, so
; keep the capitalised booleans and the current number spellings unless the
; parser is confirmed to accept other forms.
[train]
; Step budget for the run.
; NOTE(review): presumably counted in environment steps summed over all envs -- confirm.
total_timesteps = 1_000_000
; 96 / 24 = 4, i.e. four environments per worker if they are split evenly.
; NOTE(review): presumably the loader requires num_envs to divide evenly by num_workers -- confirm.
num_envs = 96
num_workers = 24
; 32 is one third of num_envs.
; NOTE(review): presumably the number of environments stepped/returned together -- confirm.
env_batch_size = 32
; NOTE(review): meaning depends on the vectorisation backend -- confirm before enabling.
zero_copy = False
; NOTE(review): presumably the number of optimisation passes over each collected batch -- confirm.
update_epochs = 3
; NOTE(review): presumably the reward discount factor -- confirm.
gamma = 0.998
; 65536 / 2048 = 32 minibatches per batch if the batch is divided evenly.
; NOTE(review): presumably batch_size must stay a multiple of minibatch_size -- confirm.
batch_size = 65536
minibatch_size = 2048
; NOTE(review): presumably toggles compilation of the model (e.g. torch.compile) -- confirm.
compile = True
; Learning rate, written in scientific notation (2.0e-4 = 0.0002).
learning_rate = 2.0e-4
; NOTE(review): with False, presumably the learning rate stays fixed for the whole run -- confirm.
anneal_lr = False
