# Run identity and "primitive_*" settings for this analysis configuration.
# NOTE(review): the exact meaning of every key is defined by the consuming
# tool, which is not visible in this file; hedged notes below need confirming.

# Run name; identical to the final path component of output_dir.
name: v90_gspo_puzzles_extra_pass8
# Relative path for this run's outputs — presumably resolved against the
# working directory of the consuming tool; verify.
output_dir: results/exploration_analysis/v90_gspo_puzzles_extra_pass8
# presumably the number of items processed per batch by the primitive
# classifier — TODO confirm.
primitive_batch_size: 512
# Selects the classifier variant by name; other accepted values are not
# visible here.
primitive_classifier: learned
# NOTE(review): 0.01 is a very permissive cut-off if this is a minimum
# probability on a 0-1 scale — confirm the scale and that it is intentional.
primitive_confidence_threshold: 0.01
# presumably enables half-precision (fp16) inference — TODO confirm.
primitive_fp16: true
# presumably disables spreading work across multiple GPUs — TODO confirm.
primitive_multi_gpu: false
# presumably the number of classifier models used (1 = no ensemble) — confirm.
primitive_n_models: 1
# Segmentation settings: a token-count range (min_tokens 80 < max_tokens 250)
# plus the tokenizer identifier.
# NOTE(review): presumably each segment must contain between min_tokens and
# max_tokens tokens as counted by this tokenizer — confirm with the consumer.
segmentation:
  max_tokens: 250
  min_tokens: 80
  # Looks like a Hugging Face Hub "org/model" id — verify how it is loaded.
  tokenizer: allenai/OLMo-3-7B-Instruct-SFT
# Checkpoints to analyse, as a mapping of checkpoint label -> settings.
# Only one checkpoint is listed.
gspo_checkpoints:
  # The label (v2, step20) corresponds to the "gspo_v2_s20" directory name in
  # puzzle_results below.
  gspo_v2_sft_step20:
    # presumably names the SFT base model this checkpoint was trained from —
    # TODO confirm.
    sft_base: v2
    # Relative path to this checkpoint's puzzle results — presumably read as
    # input by the consumer; verify.
    puzzle_results: results/v90_puzzles_extra_pass8/gspo_v2_s20
# List of task names; both share the "_pass8" suffix that also appears in the
# run name.
# NOTE(review): presumably restricts the analysis to only these tasks —
# confirm whether an empty or missing list means "all tasks".
task_filter:
- bridges_10x10dh_pass8
- undead_5x5dm_pass8
