# Name of the target this config is bound to.
_target_: skempi

# --- dataset locations ---
# `${paths.data_dir}` is an interpolation resolved outside this file.
# Earlier form, kept for reference (data_dir came from config.yaml):
# data_dir: ${data_dir}
# NOTE(review): data_dir targets cath_4.3 while every other path below
# targets SKEMPI_v2_cache -- confirm this is intentional.
data_dir: '${paths.data_dir}/cath_4.3'
chain_set_jsonl: chain_set.jsonl
chain_set_splits_json: chain_set_splits.json
# NOTE(review): csv_path, pdb_dir and cache_dir all resolve to the same
# path -- verify against the consumer that a shared directory is expected.
csv_path: '${paths.data_dir}/SKEMPI_v2_cache'
pdb_dir: '${paths.data_dir}/SKEMPI_v2_cache'
cache_dir: '${paths.data_dir}/SKEMPI_v2_cache'

# --- cross-validation and batching ---
num_cvfolds: 3
cvfold_index: 0
batch_size: 1024
max_length: 1024  # original note beside this value: 393

# Atom names, in this order.
atoms:
  - 'N'
  - 'CA'
  - 'C'
  - 'O'

# --- alphabet settings ---
alphabet:
  name: esm
  featurizer: skempi
  featurizer_cfg:
    to_pifold_format: true

# --- dataloader settings ---
max_tokens: 20000
sort: true
num_workers: 8
pin_memory: true
