---
# Run configuration. Notes on what each key means are inferred from the key
# names only; confirm against the code that loads this file.

# Identifier of the base model to load.
base_model: pythia-70m

# Explicit null: no variant is selected.
# NOTE(review): confirm how the loader treats a null variant.
variant: null

# Presumably a directory path used for caching model files; verify whether it
# is resolved relative to the working directory.
cache: model_cache

# Integer checkpoint identifiers, listed in ascending order.
# NOTE(review): these look like training-step numbers; confirm each one is
# actually published for the chosen base model.
checkpoint_schedule:
  - 512
  - 1000
  - 2000
  - 3000
  - 4000
  - 8000
  - 16000
  - 32000
  - 64000
  - 80000
  - 85000
  - 128000
  - 143000

# NOTE(review): presumably the first layer index to process; confirm whether
# the consumer counts layers from 0 or from 1.
start_layer: 2

# NOTE(review): presumably keeps existing outputs when false; confirm.
overwrite: false