# Requires 4 GPUs.

# Run identity and checkpoint location.
# The run name appears to encode several settings found further down
# (2layer-8head-768dim model, uniform_prob 0.1, 25 epochs per stage);
# keep it in sync when editing those values.
project: coconut
save_path: ckpts
name: "sprosqa-graph-coconut-2layer-8head-768dim-fixed-bug-mix-no-answer-coconut-0.1-25ep-no-neg"

# false here; presumably true skips training and only evaluates -- TODO confirm.
only_eval: false

# Method selection flags; only `coconut` is enabled in this config.
# NOTE(review): presumably at most one of these should be true -- confirm
# against the training script.
coconut: true
cot: false
no_thoughts: false
no_cot: false

# Latent-stage schedule settings.
# NOTE(review): exact semantics are defined by the consuming code, not visible
# here.
c_thought: 1
epochs_per_stage: 25
max_latent_stage: 4
pad_latent_to_max: true

# Checkpointing, model, and data settings.
save_only_improve: false
uniform_prob: 0.1
model_id: configs/symbol-2layer-8head-768dim.json
# NOTE(review): plain `None` is parsed by YAML as the string "None", not as
# null. Left unchanged because the consumer may compare against that literal
# string -- verify before switching to `null`.
load_model_path: None
seed: 0
resume: 0
bf16: false
train_path: data/prosqa_train_graph_4_coconut.json
val_path: data/prosqa_valid_graph_4_coconut.json
reset_optimizer: false
batch_size_training: 64
debug: false
gradient_accumulation_steps: 1
num_epochs: 300
# The explicit !!float tag forces a float: YAML 1.1 loaders such as PyYAML
# read a bare `1e-4` (no decimal point) as a string.
lr: !!float "1e-4"
weight_decay: 0.01