---
# Stage-1 training configuration.
# NOTE(review): several key names resemble PyTorch Lightning Trainer
# arguments; how each key is consumed is not visible in this file --
# confirm against the code that loads it.
filename: stage1

# Runtime / hardware selection.
strategy_name: deepspeed
accelerator: gpu
# Device indices to use; only index 0 is listed.
devices:
  - 0
precision: bf16-mixed
max_epochs: 50
check_val_every_n_epoch: 1
save_every_n_epochs: 5
accumulate_grad_batches: 2

# Optimizer and learning-rate schedule.
# The three rates are ordered warmup_lr < min_lr < init_lr.
# NOTE(review): presumably the rate ramps from warmup_lr to init_lr over
# warmup_steps and then decays towards min_lr -- verify in the scheduler.
weight_decay: 0.05
init_lr: 1.0e-4
min_lr: 5.0e-6
warmup_lr: 1.0e-6
warmup_steps: 1000
scheduler: linear_warmup_cosine_lr

# Model options.
# Written as the canonical lowercase boolean so every YAML schema
# (1.1, 1.2 core, 1.2 JSON) reads it as a boolean rather than a string.
tune_gnn: false
# NOTE(review): looks like a softmax/contrastive temperature -- confirm.
temperature: 0.1
