# Test-case configuration with three top-level sections: environment
# variables (ENV_VARS), model/trainer overrides (MODEL_ARGS), and the test
# type (TEST_TYPE).
# NOTE(review): the harness that consumes this file is not visible here; any
# statement below about how a value is used is an assumption to confirm.

# presumably exported into the environment of the test process — TODO confirm
ENV_VARS:
  CUDA_DEVICE_MAX_CONNECTIONS: 1
  SKIP_PYTEST: 1
# Each dotted name below (e.g. `trainer.num_nodes`) is a single flat YAML key,
# not a nested mapping; any interpretation of the dots is left to the consumer.
MODEL_ARGS:
  trainer.num_nodes: 1
  trainer.devices: 8
  # Step limit, validation interval, and validation batch limit are all 50.
  # presumably this yields a single validation pass at the final step — verify.
  trainer.max_steps: 50
  trainer.val_check_interval: 50
  trainer.limit_val_batches: 50
  # Tensor-parallel 2 x pipeline-parallel 2 = 4 devices per model replica.
  # NOTE(review): with 8 devices that presumably leaves a data-parallel size
  # of 2 — confirm against the training framework.
  trainer.strategy.tensor_model_parallel_size: 2
  trainer.strategy.pipeline_model_parallel_size: 2
  # Capitalised `True` still loads as a boolean in common YAML loaders; the
  # spelling is kept as-is in case the consumer forwards the text verbatim.
  trainer.strategy.sequence_parallel: True
  data.micro_batch_size: 2
  data.global_batch_size: 32
  data.seq_length: 512
  # YAML does not expand `${...}`; this is the literal string
  # "${CHECKPOINT_SAVE_PATH}". Substitution, if any, is done by the consumer.
  log.log_dir: ${CHECKPOINT_SAVE_PATH}
# NOTE(review): the set of accepted TEST_TYPE values is not shown in this file.
TEST_TYPE: regular
