defaults:
  - _self_

_target_: haipr.models.esmc.ESMCPredictor
model_name: ${model.name}
name: esmc_300m
num_classes: 0 # regression
is_neural: true
optimization_direction: maximize
optimization_metric: spearman_r
feature_type: sequence 
batch_size: 64
patience: 3
loss: huber
learning_rate: 1e-4
weight_decay: 1e-2
#  use for override 
peft:
  target_modules: out_proj

search_space:
  # model.batch_size: choice(4, 8, 16, 32) 
  # model.loss: choice(mse, huber, l1)
  # model.learning_rate: tag(log, interval(1e-6, 1e-3))
  # model.weight_decay: tag(log, interval(1e-4, 1e-1))
  peft.rank: choice(1, 2, 4, 8, 16, 32)
  peft.dropout: choice(0.1, 0.2, 0.3, 0.4, 0.5)

prediction_head:
  _target_: haipr.models.mlp.MLP
  input_dim: 960 # 1152 for 600m
  output_dim: 1
  num_layers: 1
  hidden_dim: 8
  dropout: 0.5
  activation: 
    _target_: torch.nn.ReLU
