---
# Trainer settings.
# NOTE(review): the key names look like PyTorch Lightning `Trainer` arguments
# consumed through a jsonargparse-style CLI — confirm against the entry point.
trainer:
  # Hardware selection is left to the framework.
  devices: auto
  accelerator: auto

  # Both limits are set to -1.
  # NOTE(review): presumably "no limit" in Lightning — confirm; likely
  # irrelevant if this config is only used for an encode/predict run.
  max_epochs: -1
  max_steps: -1
  gradient_clip_val: 1

  # Logging is switched off; outputs are rooted at the directory below.
  logger: false
  default_root_dir: 'logs/protstruct_encode/'

  callbacks:
    # `output_dir` is the same path as `default_root_dir` above; keep the two
    # in sync if either one changes.
    - class_path: modelgenerator.structure_tokenizer.callbacks.StructTokensCallback
      dict_kwargs:
        write_interval: 'epoch'
        output_dir: 'logs/protstruct_encode/'

# Model to instantiate, given as a dotted class path plus constructor args.
model:
  class_path: modelgenerator.structure_tokenizer.models.EquiformerEncoderLightning
  init_args:
    # NOTE(review): looks like a Hugging Face Hub repo id (a local path may
    # also be accepted, judging by the argument name) — confirm.
    pretrained_model_name_or_path: 'genbio-ai/AIDO.StructureEncoder'

# Data module and the protein datasets it should load.
data:
  class_path: modelgenerator.structure_tokenizer.datasets.ProteinLightningDataModule
  init_args:
    config:
      # Module-level settings; `seed` is also set per dataset below (both 0).
      seed: 0
      num_workers: 0
      # One entry per dataset; only the CASP15 sample set is listed here.
      proteins_datasets_configs:
        - name: 'casp15'
          # Paths are relative.
          # NOTE(review): presumably resolved from the working directory —
          # confirm.
          folder_path: 'data/protstruct_sample_data/CASP15_merged/'
          registry_path: 'data/protstruct_sample_data/registries/casp15_merged.csv'
          # NOTE(review): `max_nb_res` presumably caps residues per protein —
          # confirm against the dataset class.
          max_nb_res: 1024
          batch_size: 2
          seed: 0
