# @package _global_

# MLP Encoder configuration example
# This configuration file demonstrates how to configure MLP encoder parameters for different datasets

# train.py arguments
project_name: regress-lm-mlp-encoder
experiment_name: regress-lm-mlp-${now:%Y-%m-%d_%H-%M-%S}
use_wandb: false
log_dir: logs
seed: 42
batch_size: 128
num_epochs: 100
learning_rate: 1e-5
save_every_n_epochs: 10
best_save_metric: "val_mean_reward" # Metric for selecting best model during training, options: val_loss, val_mean_reward
eval_mode: false
skip_mode: false
base: 2
digits: 8
# Learning rate scheduler
scheduler:
  type: cosine
  warmup_steps: 100
  min_lr_ratio: 0.1

# Model parameters - using MLP encoder
model:
  max_input_len: 1024
  max_num_objs: 1
  d_model: 256
  num_encoder_layers: 3
  num_decoder_layers: 3
  nhead: 4
  dim_feedforward: 1024
  dropout: 0.1
  
  # MLP Encoder configuration
  encoder_type: "mlp"  # Use MLP encoder instead of vanilla transformer
  
  # MLP encoder specific parameters
  # Adjust these parameters according to your data feature dimensions
  input_dim: 42        # Input feature dimension, adjust according to dataset
  hidden_dims: [1024, 1024, 1024]  # MLP hidden layer dimension list
  output_dim: 256      # Output dimension, must be the same as d_model
  
  # Optional: more complex MLP configuration examples
  # hidden_dims: [64, 128, 256, 128, 64]  # Deeper network
  # hidden_dims: [512, 512]               # Wider network

reinforce:
  enabled: true
  temperature: 1.0  # Sampling temperature, controls exploration degree
  num_samples: 16    # Number of samples generated per input
  reward_scale: 1.0 # Reward scaling factor
  epsilon: 1e-8
  one_sided_norm: true
  expert_ce_weight: 0.05

# Dataset parameters
dataset:
  name: "dataset-name"  # Replace with your dataset name
  path:
    train: null
    val: null
  params:
    data_dir: regression_data


# Pretrained checkpoint path (optional)
init_checkpoint: null

# Other configurations
hydra:
  run:
    dir: outputs/${now:%Y-%m-%d}/${now:%H-%M-%S}

save_dir: outputs/mlp-encoder/${now:%Y-%m-%d}/${now:%H-%M-%S}/checkpoints
if_ntl: false

# Notes: input_dim configuration suggestions for different datasets
# - For numerical features: input_dim = number of features
# - For text features: input_dim = word embedding dimension
# - For mixed features: input_dim = total dimension of all features
