; Model and optimisation hyperparameters.
; NOTE(review): learning_rate and batch_size read like optimisation settings rather
; than architecture settings; they are kept in this section because the consumer may
; look keys up by section name -- confirm before moving them.
[architecture]
; Written in scientific notation (equals 0.001); presumably the optimiser step size.
learning_rate = 1e-3
; Presumably the width (number of units) of each hidden layer -- TODO confirm.
hidden_size = 1024
; Presumably the number of hidden layers/blocks -- TODO confirm how the consumer counts depth.
depth = 1
; Presumably the dropout probability; if so, 0.0 means dropout is disabled -- TODO confirm.
dropout_p = 0.0
; Presumably the number of samples per training batch -- TODO confirm.
batch_size = 1024

; Training-loop schedule and data-split settings.
[training]
; Presumably the total number of training steps before stopping -- TODO confirm
; whether "step" means an optimiser update or something else.
max_steps = 30000
; Presumably the interval, in steps, between saved checkpoints; if so, with
; max_steps = 30000 this yields 10 checkpoint intervals -- TODO confirm.
checkpoint_every_n_steps = 3000
; Presumably the fraction of the data held out for validation (0.1 = 10%) -- TODO confirm.
val_frac = 0.1

; Settings for the post-training analysis / evaluation stage.
[analysis]
; Free-form label for this run; presumably used to name or group outputs -- TODO confirm.
run_tag = antmaze-rvs-g
; Boolean-like flag; presumably enables analysis on a D4RL environment -- TODO confirm.
; NOTE(review): the capitalised spelling is kept as-is because how the consumer parses
; booleans is not visible from this file; verify before normalising to lowercase.
analyze_d4rl = True
