# Agent configuration. The interpolations below address this file's own keys
# as `agent_params.*`, so it appears to be composed under that package.
kind: DCDT
use_critic: false
learning_starts: 0
batch_size: 128
gradient_steps: 1
stochastic_policy: false
loss_fn: ce
ent_coef: 0.0
# Taken from the run-level setting `run_params.total_timesteps`.
offline_steps: ${run_params.total_timesteps}
buffer_max_len_type: transition
buffer_size: 80000000  # 8e7
buffer_weight_by: len
warmup_steps: 4000
learnable_ret: true
use_amp: true
compile: true
frozen: false
sep_eval_cache: true

# return conditioning
target_return_type: fixed
a_sample_kwargs:
  top_p: 0.5

# query type
representation_type: mean
cache_steps: 25
# Kept equal to `cache_steps` through interpolation.
cache_len: ${agent_params.cache_steps}
agg_token: s

# Freezing options.
# NOTE(review): presumably only relevant when `frozen` is enabled — confirm.
freeze_kwargs:
  exclude_crossattn: true

# Keyword arguments for the replay buffer.
# NOTE(review): `num_workers` / `pin_memory` look like data-loader settings —
# confirm against the consumer.
replay_buffer_kwargs:
  num_workers: 16
  pin_memory: false

# Keyword arguments for the cache; `eval_cache_kwargs` reads some of these
# values back through interpolation.
cache_kwargs:
  num_workers: 0
  prefetch_factor: null
  pin_memory: false
  init_top_p: 1
  exclude_same_trjs: true
  task_weight: 1
  reweight_top_k: 1
  min_seq_len: 10
  share_trjs: true
  index_kwargs:
    nb_cores: 64
    # Go with a Flat index for now; others have collisions and are slower
    # with high nprobe.
    index_key: Flat

# Keyword arguments for the evaluation cache; two values are mirrored from
# `cache_kwargs` so they only need to be changed in one place.
eval_cache_kwargs:
  index_kwargs:
    # Mirrors cache_kwargs.index_kwargs.nb_cores.
    nb_cores: ${agent_params.cache_kwargs.index_kwargs.nb_cores}
  return_weight: 1
  top_k: 50
  # Mirrors cache_kwargs.reweight_top_k.
  reweight_top_k: ${agent_params.cache_kwargs.reweight_top_k}

# Location of the file to load: a directory below `MODELS_DIR` plus a file name.
# NOTE(review): `${MODELS_DIR}` is a plain config interpolation, so the key must
# be defined elsewhere in the composed config — confirm.
# NOTE(review): presumably a pretrained model checkpoint — confirm.
load_path:
  dir_path: ${MODELS_DIR}/minihack/dark_room_dense_10x10_sfixed_grand_train
  file_name: dt_medium_64.zip

# Hydra defaults list: each entry selects one option from a config group.
# NOTE(review): there is no `_self_` entry, so whether the keys written in this
# file override these defaults (or the reverse) depends on the Hydra version —
# confirm.
defaults:
  - huggingface: dt_medium_64
  - data_paths: dark_room_10x10_sfixed_grand_train
  # Reuses whichever option was chosen for `agent_params/data_paths` and places
  # it under the `cache_data_paths` package.
  - data_paths@cache_data_paths: ${agent_params/data_paths}
  - model_kwargs: dark_room
  - lr_sched_kwargs: cosine

# Values for the `huggingface` node; the defaults list also selects a
# `huggingface` option (`dt_medium_64`).
# NOTE(review): which of the two wins on conflicting keys depends on the
# defaults-list ordering — confirm.
huggingface:
  activation_function: gelu
  max_length: 50
  add_cross_attention: true
  output_attentions: false
  n_positions: 1600
# Evaluation context length follows `huggingface.max_length`.
eval_context_len: ${agent_params.huggingface.max_length}

# Values for the `model_kwargs` node; the defaults list also selects a
# `model_kwargs` option (`dark_room`).
model_kwargs:
  global_pos_embds: true
  tokenize_rtg: false
  separate_ca_embed: true
