defaults:
  - agents: bet_mlp_vision_agent

agent_name: bet_mlp_vision
log_dir: logs/sorting/

train_data_path: environments/dataset/data/sorting/4_boxes_train_files.pkl
eval_data_path: environments/dataset/data/sorting/4_boxes_eval_files.pkl

num_boxes: 4

# insert wandb here
wandb:
  entity: ???
  project: ???

group: sorting_${agent_name}

hydra:
  run:
    dir: ${log_dir}/runs/${agent_name}/${now:%Y-%m-%d}/${now:%H-%M-%S}
  sweep:
    dir: ${log_dir}/sweeps/${agent_name}/${now:%Y-%m-%d}/${now:%H-%M-%S}
    subdir: ${hydra.job.override_dirname}

seed: 42

# Network
hidden_dim: 128
num_hidden_layers: 4

# transformer
n_layer: 4
n_head: 4
n_embd: 72

# Training
train_batch_size: 64
val_batch_size: 64
num_workers: 2
device: 'cuda'
epoch: 4
eval_every_n_epochs: 2
scale_data: True

# Environment
obs_dim: 2
action_dim: 2
max_len_data: 600
window_size: 1

# Dataset
trainset:
  _target_: environments.dataset.sorting_dataset.Sorting_Img_Dataset
  data_directory: ${train_data_path}
  obs_dim: ${obs_dim}
  action_dim: ${action_dim}
  max_len_data: ${max_len_data}
  window_size: ${window_size}
  num_boxes: ${num_boxes}

valset:
  _target_: environments.dataset.sorting_dataset.Sorting_Img_Dataset
  data_directory: ${eval_data_path}
  obs_dim: ${obs_dim}
  action_dim: ${action_dim}
  max_len_data: ${max_len_data}
  window_size: ${window_size}
  num_boxes: ${num_boxes}

# sim during training
train_simulation:
  _target_: simulation.sorting_sim.Sorting_Sim
  seed: ${seed}
  device: ${device}
  render: False
  n_cores: 1
  n_contexts: 1
  n_trajectories_per_context: 1
  max_steps_per_episode: 700
  if_vision: True
  num_box: ${num_boxes}

# Simulation
simulation:
  _target_: simulation.sorting_sim.Sorting_Sim
  seed: ${seed}
  device: ${device}
  render: False
  n_cores: 5
  n_contexts: 60
  n_trajectories_per_context: 18
  max_steps_per_episode: 700
  if_vision: True
  num_box: ${num_boxes}