_target_: haipr.models.esm3.ESM3Predictor
model_name: esm3_sm_open_v1
num_classes: 0 # regression
is_neural: true
name: ESM3
use_structure: true
chain_break_token: "|"
# optimization
optimization_direction: maximize
optimization_metric: spearman_r
# data
feature_type: sequence
# model
batch_size: 16
loss: huber
learning_rate: 0.001
weight_decay: 0.01

peft:
  target_modules: "all_linnear" # dummy gets programatically overwritten in @esm3.py

prediction_head: 
  _target_: haipr.models.mlp.MLP
  input_dim: 1536
  output_dim: 1
  num_layers: 1
  hidden_dim: 8
  dropout: 0.5
  activation: 
    _target_: torch.nn.ReLU

search_space:
  model.learning_rate: tag(log, interval(1e-6, 1e-3))
  model.weight_decay: tag(log, interval(1e-4, 1e-1))
  model.batch_size: choice(16, 32, 64, 128)
  model.loss: choice(mse, huber, l1)