# Training-run configuration.
# NOTE(review): the descriptions below are inferred from key names and values
# only; the code that consumes this file is not visible here. Confirm each one
# against the loader before relying on it.

# Run identity / task selection.
seed: 42
# Presumably names the teacher / search strategy to learn from - TODO confirm
# the set of accepted values.
teach: dfs-pruned

# Data and training budget.
# Disabled example-count setting; 500000 agrees with the "n500000" suffix of
# train_file below.
# num_train: 500000
num_tokens: 13000000
num_epochs: 200
# Presumably the node-token vocabulary size - TODO confirm whether special
# tokens are included in this count.
num_node_tokens: 102
# Presumably the maximum sequence length in tokens - TODO confirm.
context_length: 400
batch_size: 1000

# Evaluation, logging and checkpoint cadence (all three share the same
# interval of 1000; presumably counted in optimizer steps - confirm).
eval_steps: 1000
log_steps: 1000
save_steps: 1000

# Optimisation.
# A value of 1 presumably means no gradient accumulation, making the effective
# batch equal to batch_size - confirm.
gradient_accumulation_steps: 1
weight_decay: 0.05
# Presumably the fraction of total training steps used for LR warmup - confirm.
warmup_ratio: 0.1
lr: 0.003
lr_scheduler_type: cosine
# Presumably caps how many checkpoints are retained in output_dir - confirm.
save_total_limit: 2

# Paths.
# NOTE(review): all paths are relative; the base directory they are resolved
# against is not visible from this file.
model_config: configs/model_config.yaml
output_dir: output
data_dir: data
# Presumably looked up inside data_dir - confirm.
train_file: train_flower_d5-s3-l5-b3_decision_st-far_n500000.json
val_file: val_flower_d5-s3-l5-b3_decision_st-far_n5000.json
# wandb_config:
#   project: # fill in your wandb project name
#   entity:  # fill in your wandb entity name
#   dir: wandb

