# Simple test config - focus on basic functionality
# seed is pinned to 0; exp_name is also interpolated into local_run_dir further down.
seed: 0
exp_name: simple_test

# Basic training parameters
# Train and eval batch sizes are both set to 2 in this test config.
batch_size: 2
eval_batch_size: 2
debug: false
# No port is specified in this file.
# NOTE(review): presumably the training code picks a port itself when this is null - confirm.
fsdp_port: null
# Single-element list.
# NOTE(review): `hh` is presumably a dataset name known to the data-loading code - confirm.
datasets: [hh]

# wandb config
# NOTE(review): `enabled` is a top-level key here, not nested under a `wandb:`
# mapping. Confirm the consumer reads `enabled` rather than `wandb.enabled`;
# if it reads the latter, this setting has no effect.
enabled: false  # Disable wandb for simple test

# Local directories
# List of directories handed to the resolver below; here a single relative path.
local_dirs: [.cache]
# Computed by the `get_local_run_dir` resolver from exp_name and local_dirs.
# NOTE(review): that resolver is not defined in this file; presumably it is
# registered by the application before the config is resolved - confirm.
local_run_dir: ${get_local_run_dir:${exp_name},${local_dirs}}

# Learning rate and gradient handling (the `optimizer` key is set further down).
# lr is written with an explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML)
# only recognise a float when it contains a `.`, and would otherwise read the
# bare form as the string "1e-5".
lr: 1.0e-5
gradient_accumulation_steps: 1
max_grad_norm: 1.0

# Sequence length - use small values for stability
# max_prompt_length (128) is half of max_length (256).
# NOTE(review): units are presumably tokens - confirm against the tokenization code.
max_length: 256
max_prompt_length: 128

# Training settings
n_epochs: 1
# No explicit example count is set in this file.
# NOTE(review): presumably training length is then governed by n_epochs - confirm.
n_examples: null
n_eval_examples: 8
# trainer and optimizer are given as plain strings.
# NOTE(review): presumably looked up by name in the training code - confirm.
trainer: BasicTrainer
optimizer: AdamW
warmup_steps: 10
activation_checkpointing: false
# NOTE(review): the unit of eval_every (steps vs. examples) is not visible here - confirm.
eval_every: 100
minimum_log_interval_secs: 1.0

# Disable sampling during evaluation; do_first_eval is switched off as well.
sample_during_eval: false
# NOTE(review): presumably unused while sample_during_eval is false - confirm.
n_eval_model_samples: 1
do_first_eval: false

# Defaults list: this file's own values (`_self_`) are listed first, followed
# by the `model` and `loss` config-group selections.
# NOTE(review): assuming this is a Hydra defaults list, entries later in the
# list override earlier ones on conflicting keys - confirm the order is intended.
defaults:
  - _self_
  - model: gpt2_small
  - loss: tidpo