# Task name; an empty string by default.
task_name: ''

# model parameters
model_type: radt  # one of: radt, dt, dc, star_rwd_rtg
embed_dim: 128
n_layer: 3
n_head: 1
activation_function: gelu
dropout: 0.1
remove_act_embs: false
# Exponent floats carry an explicit mantissa dot so that strict YAML 1.1
# loaders (e.g. PyYAML) resolve them as floats instead of strings.
learning_rate: 1.0e-4
weight_decay: 1.0e-4
K: 20  # 20 for dt and radt, 8 for dc
timestep_sampling: true

# Options nested under `dc`.
# NOTE(review): presumably only read when model_type is dc — confirm.
dc:
  conv_window_size: 6

# Options nested under `radt`; all four switches are enabled here.
# NOTE(review): presumably only read when model_type is radt — confirm.
radt:
  stepra: true
  adaptive_scale: true
  seqra: true
  action_tanh: true

# training parameters
seed: 0
env: ant
dataset: medium-replay  # medium, medium-replay, medium-expert, expert
mode: normal  # normal for standard setting, delayed for sparse, no-reward-decay
validation_mode: align  # best, align
device: cuda
pct_traj: 1.0
batch_size: 64
warmup_steps: 10000
# Plain digits: `_` separators resolve as an integer only under YAML 1.1.
num_iterations: 100000
eval_every: 5000
eval_targets: []
num_eval_episodes: 10
test_targets: []
num_test_episodes: 100
nstep: 0

# evaluation parameters
clip_action: false

# logging parameters
# NOTE(review): `defaults` looks like a Hydra defaults list (config-group
# selections) rather than plain logging values — confirm. `_self_` is not
# listed, so where this file's own values fall in the composition order is
# left to the consuming tool's default — confirm that is intended.
defaults:
  - paths: default
  - hydra: default
  - target_returns: default

# Boolean switch; disabled by default.
computation_cost: false
