# Run configuration (flat mapping of scalar options).
# NOTE(review): the per-key notes below are inferred from the key names only;
# confirm them against the script that consumes this file.

# Model and task selection.
base_model: pythia-70m
# Explicit null: no variant is set.
variant: null
task: ioi

# Absolute, machine-specific path; presumably a model/checkpoint cache
# directory. Adjust when running on another host.
cache: /mnt/hdd-0/circuits-over-time/model_cache/ct

# dataset_size equals batch_size here, so presumably the whole dataset is
# processed as a single batch. TODO confirm.
dataset_size: 70
batch_size: 70

# Presumably selects every available checkpoint; verify accepted values.
checkpoint_schedule: all
# Presumably keeps existing results instead of recomputing them; verify.
overwrite: false

# Looks like a PyTorch-style device string (CUDA device index 1); confirm
# that this device exists on the target machine.
device: cuda:1