; Model hyperparameters, plus two optimisation settings.
; NOTE(review): learning_rate and batch_size read like training settings but
; live in this section; the consuming code is not visible from this file, so
; confirm how keys are looked up before moving them.
[architecture]
; Presumably the optimizer step size - confirm against the consuming code.
learning_rate = 1e-3
; Presumably the width of each hidden layer - confirm.
hidden_size = 1024
; Presumably the number of hidden layers - confirm whether input/output
; layers are counted.
depth = 2
; Presumably a dropout probability, where 0 means no dropout - confirm.
dropout_p = 0
; Presumably the number of samples per optimisation step - confirm.
batch_size = 16384

; Training-loop length, checkpoint cadence, and validation split.
[training]
; Upper bound on training steps. NOTE(review): whether a "step" is one
; optimizer update is not visible here - confirm.
max_steps = 20000
; Checkpoint interval, in steps. At the current values it divides max_steps
; evenly (20000 / 2000 = 10 intervals).
checkpoint_every_n_steps = 2000
; Presumably the fraction of the data held out for validation (0.1 = 10%) -
; confirm how the split is taken.
val_frac = 0.1

; Settings for labelling and post-run analysis.
[analysis]
; Free-form label for this run. How it is used (e.g. naming outputs) is not
; visible from this file - confirm against the consuming code.
run_tag = antmaze-rvs-g
; Boolean flag, spelled with a capital T. NOTE(review): confirm the consuming
; parser accepts this spelling (Python configparser's getboolean() does,
; case-insensitively); what the flag enables is not visible here.
analyze_d4rl = True