# NOTE(review): train_config.force_retrain further down carries the same value.
# How the two flags differ is not visible in this file — confirm which one the
# pipeline actually reads.
cond_force_retrain: true
# Model definition for the `r3m_dan` model type.
# NOTE(review): the role of each sub-section is inferred from its key name;
# confirm against the model code before relying on these comments.
model_config:
  # Action inputs: `identity` type, 7 values per step, loaded from the actions pickle.
  act_config:
    demo_pkl: data/stack_task_D0/100_actions.pkl
    input_len: 7
    scale: true
    scale_output: false
    type: identity

  dan: true
  # Same file as fusion_config.demo_pkl below.
  demo_pkl: data/stack_task_D0/100_r3m_full.pkl

  # Fusion head: `mlp` type with three hidden_dims entries; output_len (7)
  # equals act_config.input_len.
  fusion_config:
    batch_norm: false
    demo_pkl: data/stack_task_D0/100_r3m_full.pkl
    dropout_rate: 0.0
    hidden_dims: [1024, 512, 512]
    # Presumably selects the entry keyed 0 under train_config.optimizers — verify.
    optimizer: 0
    output_len: 7
    scale: true
    scale_input: false
    type: mlp

  # Proprioception inputs: `identity` type, 9 values per step.
  prop_config:
    batch_norm: false
    demo_pkl: data/stack_task_D0/100_proprio.pkl
    input_len: 9
    # NOTE(review): train_config.optimizers only defines key 0; confirm that
    # optimizer 1 is never looked up for this section.
    optimizer: 1
    scale: true
    scale_output: false
    type: identity

  # R3M feature inputs: 512-long feature vector, 224x224 RGB, no scaling.
  r3m_config:
    input_len: 512
    rgb_height: 224
    rgb_width: 224
    scale: false
    type: identity

  # k, lookback, decay_rate and final_neighbors_ratio equal the parameters
  # recorded for trial 248 in the log comment at the end of this file.
  retrieval_config:
    decay_rate: -0.7944318560051231
    final_neighbors_ratio: 0.2630981787611679
    k: 835
    lookback: 41
    method: knn

  sideload_r3m: true
  tune: false
  type: r3m_dan
# Training settings for the `r3m_dan` model.
train_config:
  batch_size: 32
  # 32 is the `epochs` value recorded for trial 248 in the log comment at the
  # end of this file.
  epochs: 32
  # Commented-out alternative value:
  # epochs: 206
  force_retrain: true
  model_name: r3m_dan
  # Optimizer settings keyed by integer id. model_config.fusion_config.optimizer
  # is 0. NOTE(review): model_config.prop_config.optimizer is 1, which has no
  # entry here — confirm that is intentional.
  optimizers:
    0:
      # Keep the explicit `.0` in the mantissa: YAML 1.1 loaders such as PyYAML
      # resolve `1e-3` (no dot) as the string '1e-3' instead of a float.
      lr: 1.0e-3
      weight_decay: 1.0e-5

# Tuning log for the epochs / retrieval_config values above (log format looks like Optuna — confirm):
# [I 2025-08-09 23:18:05,599] Trial 248 finished with value: 0.76 and parameters: {'epochs': 32, 'k': 835, 'lookback': 41, 'decay_rate': -0.7944318560051231, 'final_neighbors_ratio': 0.2630981787611679}. Best is trial 248 with value: 0.76.

