# Base configuration file(s) this experiment builds on.
# NOTE(review): presumably the loader reads these first and lets the keys
# defined in this file take precedence — confirm the merge order.
inherit:
    - models/tiny.yaml

# Model settings for this experiment. Anything not listed here is presumably
# supplied by the inherited base file — verify against the loader.
model:
    family: gpt2_nn
    # NOTE(review): 101 looks like "100 + 1" positions — confirm what the
    # extra slot is reserved for.
    n_positions: 101
    zero_pad_embed: false
    # Both intermediate-activation counts are zero in this config.
    n_intermediate_activations: 0
    n_seen_intermediate: 0
    hidden_sep_linear: false

# Training-run settings: data source, task, optimisation and checkpointing.
training:
    data: gaussian
    task: long_chain
    # Only `mode` is set here.
    # NOTE(review): presumably forwarded as keyword arguments to the task —
    # confirm against the task constructor.
    task_kwargs:
        mode: 'relu'
    batch_size: 64
    # Kept in plain decimal form on purpose: exponent notation without a
    # dot/sign (e.g. 1e-4) is read as a string by YAML 1.1 loaders.
    learning_rate: 0.0001
    # Save and keep intervals are identical in this config.
    save_every_steps: 1000
    keep_every_steps: 1000
    # NOTE(review): one more than 50000 — presumably so that step 50000
    # itself is reached and checkpointed; confirm against the training loop.
    train_steps: 50001
    curriculum:
        # start == end, so the value presumably stays at 5 for the whole run
        # and inc/interval have no visible effect — confirm.
        dims:
            start: 5
            end: 5
            inc: 1
            interval: 2000
