; Hyperparameters for the main model.
; NOTE(review): learning_rate and batch_size read as optimisation/data-loading
; settings rather than architecture; they are grouped in this section as-is.
[architecture]
; Written in scientific notation (0.001).
learning_rate = 1e-3
; Presumably the width of each hidden layer - TODO confirm against the model code.
hidden_size = 1024
; Presumably the number of hidden layers - TODO confirm.
depth = 2
; Presumably a dropout probability, so 0.0 would disable dropout - TODO confirm.
dropout_p = 0.0
batch_size = 2048

; Conditioning switches; both are set to True in this configuration.
; NOTE(review): booleans are spelled with a capital "T". Keep this spelling
; unless the consuming parser is confirmed to accept other forms.
[conditioning]
; Presumably conditions the model on reward - TODO confirm against the consumer.
reward_conditioning = True
; Presumably selects cumulative reward-to-go as the conditioning signal
; - TODO confirm how it interacts with reward_conditioning.
cumulative_reward_to_go = True

; Settings for the bootstrapping stage. Apart from bootstrap_iters, every key
; carries a "bts_" prefix.
; NOTE(review): presumably the bts_* keys configure a separate auxiliary model
; with its own optimiser settings - confirm against the consumer.
[bootstrapping]
; Presumably the number of bootstrapping rounds - TODO confirm.
bootstrap_iters = 1
; Half of hidden_size (1024) in [architecture].
bts_hidden_size = 512
bts_n_layers = 2
; 301 bins over the range [bts_min_v, bts_max_v] = [0.0, 300.0]. If bins are
; evenly spaced points that include both endpoints, the spacing is exactly 1.0
; - TODO confirm the binning scheme.
bts_n_bins = 301
bts_min_v = 0.0
bts_max_v = 300.0
; Presumably a dropout probability, so 0.0 would disable dropout - TODO confirm.
bts_dropout_p = 0.0
; Same value as learning_rate in [architecture].
bts_learning_rate = 1e-3
; Eight times batch_size (2048) in [architecture].
bts_batch_size = 16384
bts_epochs = 10

; Training-loop settings for the main model.
[training]
epochs = 100
; Equal to epochs, so presumably a checkpoint is written only once, at the end
; of training - TODO confirm how the consumer counts epochs.
checkpoint_every_n_epochs = 100
; Presumably the fraction of data held out for validation, so 0 would mean no
; hold-out - TODO confirm. Written as the integer 0, not 0.0.
val_frac = 0

; Post-training analysis settings.
[analysis]
; Free-form label; presumably used to identify this run in outputs - TODO confirm.
run_tag = maze2d-rvs-r
; NOTE(review): presumably enables analysis on D4RL environments/datasets
; - confirm against the consumer.
analyze_d4rl = True
; Presumably the number of CPU workers used for analysis - TODO confirm.
num_cpu = 1