# Model stanza: `class_path` names the class to build and `init_args` holds
# the keyword arguments handed to it.
# NOTE(review): the class_path/init_args layout looks like a
# LightningCLI/jsonargparse config - confirm against the entry point.
model:
  class_path: desiddpayne.models.AIONCrossAttentionProbing
  init_args:
    n_outputs: 16
    num_heads: 16
    # Path is relative - presumably resolved against the launch directory;
    # verify.
    model_path: "data/aion/dec24/large"
    num_encoder_tokens: 600
    # Written with an explicit decimal point: YAML 1.1 resolvers (PyYAML's
    # default) load a bare `1e-4` as the string "1e-4", not a float.
    lr: 1.0e-4
# Data stanza: the class to build plus its keyword arguments.
data:
  class_path: desiddpayne.dataset.DESIDDPayneDatasetModule
  init_args:
    # Relative directory - presumably resolved against the launch directory;
    # verify.
    data_dir: 'data'
    # Names of the dataset fields fed to the model.
    # NOTE(review): these look like tokenized BP/RP inputs - confirm against
    # the dataset module.
    input_fields:
      - 'tok_xp_bp'
      - 'tok_xp_rp'
    batch_size: 256
    # NOTE(review): presumably forwarded to a DataLoader, where 0 would mean
    # loading in the main process - confirm.
    num_workers: 0
    # Quoted on purpose so the value stays the string "1", not the integer 1.
    version: '1'
# Trainer stanza: run length, hardware/precision, logging cadence, callbacks
# and logger.
# NOTE(review): keys look like Lightning `Trainer` arguments - confirm against
# the entry point.
trainer:
  max_epochs: 10
  accelerator: gpu
  precision: "bf16-mixed"
  # Log on every step.
  log_every_n_steps: 1
  callbacks:
    # Short class name with no module path - presumably resolved by the
    # consuming CLI; verify.
    - class_path: LearningRateMonitor
      init_args:
        logging_interval: "step"
  logger:
    class_path: WandbLogger
    init_args:
      name: "large_xatt_xp"
      project: "aion_eval_desiddpayne"
      # Same directory as `default_root_dir` below; keep the two in sync.
      save_dir: "data/AION_Eval/results"
  default_root_dir: "data/AION_Eval/results"
