
# Run identity. NOTE(review): `seed` is presumably the RNG seed and `exp_name`
# the label for this run (it is also fed into `local_run_dir`) -- confirm.
seed: 0
exp_name: stable_test

# Batch sizes for training and evaluation.
batch_size: 1
eval_batch_size: 1

# Runtime switches. NOTE(review): `fsdp_port` is left null; how the consumer
# treats a null port is not visible in this file -- confirm.
debug: false
fsdp_port: null

# Dataset identifiers (single entry: `hh`).
datasets: [hh]


# Weights & Biases settings; logging is switched off for this config.
wandb:
  enabled: false


# Local directories and the derived run directory.
# `local_run_dir` is an OmegaConf interpolation that calls a custom resolver
# named `get_local_run_dir` with `exp_name` and `local_dirs` as arguments.
# The resolver is not defined in this file, so the application must register
# it before this value is resolved.
local_dirs: [.cache]
local_run_dir: ${get_local_run_dir:${exp_name},${local_dirs}}


# Optimization hyperparameters.
# `lr` is written with an explicit decimal point in the mantissa so that
# YAML 1.1 loaders (e.g. PyYAML) resolve it as a float; the bare form `1e-6`
# is read as the string "1e-6" by such loaders.
lr: 1.0e-6
# NOTE(review): `batch_size` in this file is 1, which is smaller than
# `gradient_accumulation_steps`. If the trainer splits each batch into this
# many micro-batches, confirm the combination is valid.
gradient_accumulation_steps: 4
# NOTE(review): presumably the gradient-norm clipping threshold -- confirm.
max_grad_norm: 0.5


# Sequence length limits. NOTE(review): units are presumably tokens, with
# `max_prompt_length` bounding the prompt portion of `max_length` -- confirm.
max_length: 128
max_prompt_length: 64


# Training loop settings.
# NOTE(review): `n_examples` is null while `n_epochs` is set; presumably only
# one of the two bounds the run length -- confirm against the trainer.
n_epochs: 1
n_examples: null
n_eval_examples: 4
# Names of the trainer and optimizer to use; they are resolved by the
# application, not by this file.
trainer: BasicTrainer
optimizer: AdamW
warmup_steps: 50
activation_checkpointing: false
# NOTE(review): the unit of `eval_every` (steps vs. examples) is not visible
# here -- confirm.
eval_every: 50
minimum_log_interval_secs: 1.0


# Evaluation-time sampling. Sampling during eval is disabled, as is the
# initial evaluation (`do_first_eval`).
# NOTE(review): `n_eval_model_samples` presumably only matters when
# `sample_during_eval` is true -- confirm.
sample_during_eval: false
n_eval_model_samples: 1
do_first_eval: false

# Hydra defaults list. `_self_` comes first, so this file's values are composed
# before the `model` and `loss` group configs listed after it.
defaults:
  - _self_
  - model: gpt2_small
  - loss: tidpo