# Job-submission settings. NOTE(review): presumably Azure ML, going by the
# `aml` key; confirm against the code that consumes this section.
aml:
  workspace: mlw-deeplearning1h7w
  # Compute targets listed here by the author:
  #   ia-a100-cluster-hp (active), ia-a100-instance, ia-cpu-instance
  compute: ia-a100-cluster-hp
  environment: cuda121-py312-uv
  exp_name: cross-encoder-nli-triplet
  # Derived from model.backbone through the `split` resolver. `split` is not
  # an OmegaConf/Hydra built-in, so it is presumably registered by the
  # application before the config is resolved (confirm).
  job_name: '${split:${model.backbone}}'
  file: main.py

# Dataset selection: one training set name and a list of test set names.
# NOTE(review): the meaning of is_test / is_dummy is defined by the consuming
# code, which is not visible from this file.
data:
  train: nli_triplet
  test:
    - nli_triplet
  is_test: false
  is_dummy: false

# model.backbone is interpolated into aml.job_name and save_mdl.name, and is
# the parameter swept under hydra.sweeper.params.
model:
  arch: cross-encoder-nli-triplet
  # Other backbones noted here by the author:
  #   aarabil/Qwen3-Embedding-0.6B
  #   answerdotai/ModernBERT-base
  #   Alibaba-NLP/gte-modernbert-base
  #   aarabil/deberta-v3-base
  backbone: aarabil/bert-base-uncased

# Name built from the selected backbone plus a fixed suffix. Because the
# backbone ids in this file have the form `owner/model`, the resolved name
# contains a `/`.
save_mdl:
  name: '${model.backbone}-nli-triplet'

# Metric names, grouped by task type; each group is a list of strings.
metrics:
  binary:
    - roc
  multiclass:
    - f1

# Settings for the pretraining stage.
pretraining:
  is_on: true
  batch_size: 32
  epochs: 3
  # Learning rates carry an explicit decimal point on purpose: a dotless
  # exponent form such as `8e-6` is read as a *string* by YAML 1.1 loaders
  # (e.g. PyYAML's default resolver). With the decimal point the value is a
  # float under every loader, and unchanged under OmegaConf/Hydra.
  lr_backbone: 8.0e-6
  # Alternative noted by the author: ${pretraining.lr_backbone}
  lr_head: 4.0e-5
  lr_schedule: cosine
  freeze_backbone_until: 0
  # NOTE(review): patience (10) exceeds epochs (3); confirm the unit that the
  # training code uses for patience.
  patience: 10

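# Fine-tuning stage: currently disabled, kept commented out for reference.
# NOTE(review): if re-enabled, `patience: 1e9` does not parse as an integer;
# use an integer literal if the training code expects one.
# finetuning:
#   is_on: false
#   batch_size: 32
#   epochs: 1
#   lr_backbone: 1e-5
#   lr_head: 1e-5
#   lr_schedule: linear
#   freeze_backbone_until: 0
#   patience: 1e9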

# --------------- hydra configs -------------------------------

hydra:
  # Sweep definition; only takes effect in multirun mode (-m / --multirun).
  sweeper:
    params:
      # Comma-separated choices. The folded scalar joins the lines below with
      # single spaces, yielding one "a, b, c" string.
      model.backbone: >-
        aarabil/bert-large-uncased,
        aarabil/deberta-v3-large,
        answerdotai/ModernBERT-large

  run:
    # Alternative noted by the author:
    #   hydra/outputs/${now:%Y-%m-%d}/${now:%H-%M-%S}
    dir: .
  sweep:
    dir: hydra/outputs/${now:%Y-%m-%d}/${now:%H-%M-%S}
  # null turns off Hydra's per-run config output subdirectory.
  output_subdir: null

# Hydra defaults list.
defaults:
  # This file's own values are composed first, so the entries below can
  # override them.
  - _self_
  # `mode` config group: no option selected unless chosen explicitly.
  - mode: null
  # Use Hydra's `disabled` job_logging config.
  - override hydra/job_logging: disabled