# Base config to inherit from; the keys below are applied on top of it.
# NOTE(review): assumes Hydra-style defaults-list semantics - confirm.
defaults:
  - default

# Plain DDP alternative, kept for reference:
# strategy: ddp
# DDP variant that checks for unused parameters.
strategy: ddp_find_unused_parameters_true

accelerator: gpu
devices: 1  # options: 1, 2, 3, 4, 5, 6, 7
num_nodes: 1
sync_batchnorm: true
accumulate_grad_batches: 1
precision: bf16-mixed  # use bfloat16 precision
