# Agent configuration for kind "CDT". The `defaults` list and the `${...}`
# interpolations follow Hydra/OmegaConf conventions.
# NOTE(review): the meaning of each key is defined by the consuming code,
# which is not visible from this file; the comments below describe only what
# the values themselves show.
kind: "CDT"
learning_starts: 0
batch_size: 128
gradient_steps: 1
stochastic_policy: false
loss_fn: "mse"
eval_context_len: 20
ent_coef: 0.0
# Interpolated from run_params.total_timesteps, which has to be defined
# elsewhere in the composed config.
offline_steps: ${run_params.total_timesteps}
buffer_max_len_type: "transition"
buffer_size: 80000000  # 8e7
buffer_weight_by: len
target_return_type: predefined
warmup_steps: 4000
replay_buffer_kwargs:
  num_workers: 16
  pin_memory: false
cache_kwargs:
  num_workers: 0
  prefetch_factor: null
  pin_memory: false
  init_top_p: 0.01
use_amp: true
compile: true
# File to load: <dir_path>/<file_name>. MODELS_DIR is an interpolation that
# has to resolve elsewhere in the composed config.
# NOTE(review): presumably a saved model checkpoint - confirm with the loader.
load_path:
  dir_path: ${MODELS_DIR}/d4rl/hopper
  file_name: medium.zip
defaults:
  - huggingface: d4rl
  # Disabled entry, kept for reference:
  # - data_paths: d4rl
  # `group@package` form: the d4rl option of the data_paths group is placed
  # under the cache_data_paths key instead of data_paths.
  - data_paths@cache_data_paths: d4rl
  - model_kwargs: default
  - lr_sched_kwargs: cosine
# Combined with the `huggingface: d4rl` selection from `defaults` above.
# NOTE(review): no `_self_` entry is listed, so which side wins on conflicting
# keys follows the default ordering of the Hydra version in use - confirm.
huggingface:
  activation_function: gelu
  use_fast_attn: true
