
# Run identity.
seed: 0
exp_name: basic_test

# Batch sizes and top-level switches.
batch_size: 2
eval_batch_size: 2
debug: false
# null = no port set in this file.
# NOTE(review): presumably the consumer picks one itself when unset — confirm.
fsdp_port: null
# Dataset names to use; a single entry here.
datasets:
- hh


# wandb settings; disabled in this config.
wandb:
  enabled: false


# Candidate local directories; a single entry here.
local_dirs:
- .cache
# Computed by the `get_local_run_dir` resolver from exp_name and local_dirs.
# The resolver is not defined in this file; the application must register it.
local_run_dir: ${get_local_run_dir:${exp_name},${local_dirs}}


# Optimization hyperparameters.
# lr keeps an explicit decimal point: YAML 1.1 loaders (e.g. stock PyYAML)
# only resolve exponent notation as a float when the mantissa contains '.',
# and would otherwise read `1e-5` as the string "1e-5".
lr: 1.0e-5
gradient_accumulation_steps: 1
max_grad_norm: 1.0


# Length limits for the full sequence and for the prompt portion.
# NOTE(review): units are not shown in this file; presumably tokens — confirm.
max_length: 256
max_prompt_length: 128


# Training-loop settings. Exact semantics are defined by the consuming code,
# which is not visible from this file.
n_epochs: 1
# null = unset here.
# NOTE(review): presumably means "no cap on training examples" — confirm.
n_examples: null
n_eval_examples: 8
# Name strings; presumably resolved to classes by the training code — confirm.
trainer: BasicTrainer
optimizer: AdamW
warmup_steps: 10
activation_checkpointing: false
# NOTE(review): unit of eval_every (steps vs. examples) is not visible here.
eval_every: 100
minimum_log_interval_secs: 1.0


# Evaluation-time sampling switches; both sampling and the first eval are off.
sample_during_eval: false
# NOTE(review): presumably only consulted when sample_during_eval is true.
n_eval_model_samples: 1
do_first_eval: false

# Config-group defaults list. `_self_` comes first, so this file's own values
# are composed before the `model` and `loss` group selections that follow.
defaults:
- _self_
- model: gpt2_small
- loss: tidpo