_target_: lightning.pytorch.trainer.Trainer

default_root_dir: ${paths.output_dir}

# train/val
min_epochs: 100
max_epochs: -1
max_steps: 150000
max_time: null
check_val_every_n_epoch: null
val_check_interval: 1000
log_every_n_steps: 5
enable_progress_bar: True
num_sanity_val_steps: 0
use_distributed_sampler: True

# backend
accelerator: auto
devices: auto
accumulate_grad_batches: 1

# strategy: ddp_find_unused_parameters_true

strategy:
  _target_: lightning.pytorch.strategies.DDPStrategy
  find_unused_parameters: True
  # process_group_backend: "nccl"
  timeout:
    _target_: datetime.timedelta
    seconds: 86400

precision: bf16-mixed
num_nodes: 1

# grad clip
gradient_clip_val: 1.0
gradient_clip_algorithm: "norm"

# inference
deterministic: False
inference_mode: False

# misc
detect_anomaly: False
sync_batchnorm: False
fast_dev_run: False
reload_dataloaders_every_n_epochs: 0 # set to a positive integer to allow valid-test during training

# other common args
limit_train_batches: null
limit_val_batches: null
limit_test_batches: null
profiler: null
