# Launch modal_fever_run.py with a fixed set of command-line options.
#
# The argument list is assembled step by step in the positional parameters
# and handed to a single python invocation at the end. Arguments passed to
# this script itself are discarded; nothing is forwarded from the caller.
# The meaning of each flag is defined by modal_fever_run.py, not here.
set --

# Model name and sample counts.
set -- "$@" --model_name gpt2
set -- "$@" --train_samples 50000
set -- "$@" --eval_samples 5000
set -- "$@" --max_seq_len 256

# Epoch, batch, learning-rate and loss-weight options.
set -- "$@" --epochs 5
set -- "$@" --batch_size 16
set -- "$@" --lr 5e-5
set -- "$@" --consistency_loss_weight 0.5
set -- "$@" --freeze_lower_layers_epochs 1

# Seed and output stem.
set -- "$@" --seed 42
set -- "$@" --output_stem fever50k_tightened_diag

# Comma-separated variant list, passed as one single argument.
set -- "$@" --variants no_consistency_loss,evidence_only_pooling,evidence_only_strict,claim_only_pooling,evidence_only_random_labels

# The script's exit status is that of the python process.
python modal_fever_run.py "$@"
