# Launch main.py with model=aux_lm (arch t5-base) on data=strategyqa, with
# save_checkpoint=True and both io modes set to "IreplacedR-O".
# NOTE(review): "-m" plus the comma-separated seed list is presumably a
# multirun sweep over seeds 0, 1 and 2 -- confirm against main.py.
# The overrides are collected in an array and passed in their original order.
overrides=(
  save_checkpoint=True
  logger.offline=False
  training.io_mode="IreplacedR-O"
  training.aux_io_mode="IreplacedR-O"
  data=strategyqa
  model=aux_lm
  model.arch=t5-base
  model.optimizer.lr=3e-4
  model/scheduler=linear_with_warmup
  model.scheduler.warmup_updates=0.06
  setup.train_batch_size=16
  setup.accumulate_grad_batches=1
  setup.eff_train_batch_size=16
  setup.eval_batch_size=16
  setup.num_workers=3
  seed=0,1,2
)
python main.py -m "${overrides[@]}"

# Launch main.py with training=finetune and model=kd_lm (arch t5-base) on
# data=strategyqa for seed=0, with two comma-separated learning-rate values
# (3e-4 and 5e-4).
# The checkpoint path is hard-coded. The shell strips the outer double
# quotes, so the inner single quotes reach main.py as part of the value.
# NOTE(review): LFTR-5068 is presumably the seed=0 run of the t5-base aux_lm
# command earlier in this file -- confirm before re-running.
overrides=(
  save_checkpoint=False
  logger.offline=False
  training=finetune
  training.ckpt_path="'LFTR-5068/checkpoints/epoch=7-step=647.ckpt'"
  training.io_mode="I-O"
  training.aux_io_mode="IreplacedR-O"
  data=strategyqa
  model=kd_lm
  model.arch=t5-base
  model.optimizer.lr=3e-4,5e-4
  model/scheduler=linear_with_warmup
  model.scheduler.warmup_updates=0.06
  setup.train_batch_size=16
  setup.accumulate_grad_batches=1
  setup.eff_train_batch_size=16
  setup.eval_batch_size=16
  setup.num_workers=3
  seed=0
)
python main.py -m "${overrides[@]}"

# Launch main.py with training=finetune and model=kd_lm (arch t5-base) on
# data=strategyqa for seed=1, with two comma-separated learning-rate values
# (3e-4 and 5e-4).
# The checkpoint path is hard-coded. The shell strips the outer double
# quotes, so the inner single quotes reach main.py as part of the value.
# NOTE(review): LFTR-5069 is presumably the seed=1 run of the t5-base aux_lm
# command earlier in this file -- confirm before re-running.
overrides=(
  save_checkpoint=False
  logger.offline=False
  training=finetune
  training.ckpt_path="'LFTR-5069/checkpoints/epoch=4-step=404.ckpt'"
  training.io_mode="I-O"
  training.aux_io_mode="IreplacedR-O"
  data=strategyqa
  model=kd_lm
  model.arch=t5-base
  model.optimizer.lr=3e-4,5e-4
  model/scheduler=linear_with_warmup
  model.scheduler.warmup_updates=0.06
  setup.train_batch_size=16
  setup.accumulate_grad_batches=1
  setup.eff_train_batch_size=16
  setup.eval_batch_size=16
  setup.num_workers=3
  seed=1
)
python main.py -m "${overrides[@]}"

# Launch main.py with training=finetune and model=kd_lm (arch t5-base) on
# data=strategyqa for seed=2, with two comma-separated learning-rate values
# (3e-4 and 5e-4).
# The checkpoint path is hard-coded. The shell strips the outer double
# quotes, so the inner single quotes reach main.py as part of the value.
# NOTE(review): LFTR-5070 is presumably the seed=2 run of the t5-base aux_lm
# command earlier in this file -- confirm before re-running.
overrides=(
  save_checkpoint=False
  logger.offline=False
  training=finetune
  training.ckpt_path="'LFTR-5070/checkpoints/epoch=8-step=728.ckpt'"
  training.io_mode="I-O"
  training.aux_io_mode="IreplacedR-O"
  data=strategyqa
  model=kd_lm
  model.arch=t5-base
  model.optimizer.lr=3e-4,5e-4
  model/scheduler=linear_with_warmup
  model.scheduler.warmup_updates=0.06
  setup.train_batch_size=16
  setup.accumulate_grad_batches=1
  setup.eff_train_batch_size=16
  setup.eval_batch_size=16
  setup.num_workers=3
  seed=2
)
python main.py -m "${overrides[@]}"



# Launch main.py with model=aux_lm (arch t5-large, lr 5E-5) on
# data=strategyqa, with save_checkpoint=True and both io modes set to
# "IreplacedR-O".
# NOTE(review): "-m" plus the comma-separated seed list is presumably a
# multirun sweep over seeds 0, 1 and 2 -- confirm against main.py.
# The overrides are collected in an array and passed in their original order.
overrides=(
  save_checkpoint=True
  logger.offline=False
  training.io_mode="IreplacedR-O"
  training.aux_io_mode="IreplacedR-O"
  data=strategyqa
  model=aux_lm
  model.arch=t5-large
  model.optimizer.lr=5E-5
  model/scheduler=linear_with_warmup
  model.scheduler.warmup_updates=0.06
  setup.train_batch_size=16
  setup.accumulate_grad_batches=1
  setup.eff_train_batch_size=16
  setup.eval_batch_size=16
  setup.num_workers=3
  seed=0,1,2
)
python main.py -m "${overrides[@]}"

# Launch main.py with training=finetune and model=kd_lm (arch t5-large) on
# data=strategyqa for seed=0, with two comma-separated learning-rate values
# (1E-4 and 3E-4).
# The checkpoint path is hard-coded. The shell strips the outer double
# quotes, so the inner single quotes reach main.py as part of the value.
# NOTE(review): LFTR-5119 is presumably the seed=0 run of the t5-large
# aux_lm command earlier in this file -- confirm before re-running.
overrides=(
  save_checkpoint=False
  logger.offline=False
  training=finetune
  training.ckpt_path="'LFTR-5119/checkpoints/epoch=8-step=728.ckpt'"
  training.io_mode="I-O"
  training.aux_io_mode="IreplacedR-O"
  data=strategyqa
  model=kd_lm
  model.arch=t5-large
  model.optimizer.lr=1E-4,3E-4
  model/scheduler=linear_with_warmup
  model.scheduler.warmup_updates=0.06
  setup.train_batch_size=16
  setup.accumulate_grad_batches=1
  setup.eff_train_batch_size=16
  setup.eval_batch_size=16
  setup.num_workers=3
  seed=0
)
python main.py -m "${overrides[@]}"

# Launch main.py with training=finetune and model=kd_lm (arch t5-large) on
# data=strategyqa for seed=1, with two comma-separated learning-rate values
# (1E-4 and 3E-4).
# The checkpoint path is hard-coded. The shell strips the outer double
# quotes, so the inner single quotes reach main.py as part of the value.
# NOTE(review): LFTR-5120 is presumably the seed=1 run of the t5-large
# aux_lm command earlier in this file -- confirm before re-running.
overrides=(
  save_checkpoint=False
  logger.offline=False
  training=finetune
  training.ckpt_path="'LFTR-5120/checkpoints/epoch=2-step=242.ckpt'"
  training.io_mode="I-O"
  training.aux_io_mode="IreplacedR-O"
  data=strategyqa
  model=kd_lm
  model.arch=t5-large
  model.optimizer.lr=1E-4,3E-4
  model/scheduler=linear_with_warmup
  model.scheduler.warmup_updates=0.06
  setup.train_batch_size=16
  setup.accumulate_grad_batches=1
  setup.eff_train_batch_size=16
  setup.eval_batch_size=16
  setup.num_workers=3
  seed=1
)
python main.py -m "${overrides[@]}"

# Launch main.py with training=finetune and model=kd_lm (arch t5-large) on
# data=strategyqa for seed=2, with two comma-separated learning-rate values
# (1E-4 and 3E-4).
# The checkpoint path is hard-coded. The shell strips the outer double
# quotes, so the inner single quotes reach main.py as part of the value.
# NOTE(review): LFTR-5121 is presumably the seed=2 run of the t5-large
# aux_lm command earlier in this file -- confirm before re-running.
overrides=(
  save_checkpoint=False
  logger.offline=False
  training=finetune
  training.ckpt_path="'LFTR-5121/checkpoints/epoch=8-step=728.ckpt'"
  training.io_mode="I-O"
  training.aux_io_mode="IreplacedR-O"
  data=strategyqa
  model=kd_lm
  model.arch=t5-large
  model.optimizer.lr=1E-4,3E-4
  model/scheduler=linear_with_warmup
  model.scheduler.warmup_updates=0.06
  setup.train_batch_size=16
  setup.accumulate_grad_batches=1
  setup.eff_train_batch_size=16
  setup.eval_batch_size=16
  setup.num_workers=3
  seed=2
)
python main.py -m "${overrides[@]}"

# Launch main.py with training=finetune and model=kd_lm on data=strategyqa
# for seed=0, using model.arch=t5-base together with model.aux_arch=t5-large.
# Two comma-separated values are given for both the learning rate
# (4E-4, 5E-4) and model.kd_input (True, False); model.kd_target is True.
# The checkpoint path is hard-coded. The shell strips the outer double
# quotes, so the inner single quotes reach main.py as part of the value.
# NOTE(review): LFTR-5119 is presumably the seed=0 run of the t5-large
# aux_lm command earlier in this file -- confirm before re-running.
overrides=(
  save_checkpoint=False
  logger.offline=False
  training=finetune
  training.ckpt_path="'LFTR-5119/checkpoints/epoch=8-step=728.ckpt'"
  training.io_mode="I-O"
  training.aux_io_mode="IreplacedR-O"
  data=strategyqa
  model=kd_lm
  model.arch=t5-base
  model.aux_arch=t5-large
  model.optimizer.lr=4E-4,5E-4
  model/scheduler=linear_with_warmup
  model.scheduler.warmup_updates=0.06
  setup.train_batch_size=16
  setup.accumulate_grad_batches=1
  setup.eff_train_batch_size=16
  setup.eval_batch_size=16
  setup.num_workers=3
  seed=0
  model.kd_input=True,False
  model.kd_target=True
)
python main.py -m "${overrides[@]}"

# Launch main.py with training=finetune and model=kd_lm on data=strategyqa
# for seed=1, using model.arch=t5-base together with model.aux_arch=t5-large.
# Two comma-separated values are given for both the learning rate
# (4E-4, 5E-4) and model.kd_input (True, False); model.kd_target is True.
# The checkpoint path is hard-coded. The shell strips the outer double
# quotes, so the inner single quotes reach main.py as part of the value.
# NOTE(review): LFTR-5120 is presumably the seed=1 run of the t5-large
# aux_lm command earlier in this file -- confirm before re-running.
overrides=(
  save_checkpoint=False
  logger.offline=False
  training=finetune
  training.ckpt_path="'LFTR-5120/checkpoints/epoch=2-step=242.ckpt'"
  training.io_mode="I-O"
  training.aux_io_mode="IreplacedR-O"
  data=strategyqa
  model=kd_lm
  model.arch=t5-base
  model.aux_arch=t5-large
  model.optimizer.lr=4E-4,5E-4
  model/scheduler=linear_with_warmup
  model.scheduler.warmup_updates=0.06
  setup.train_batch_size=16
  setup.accumulate_grad_batches=1
  setup.eff_train_batch_size=16
  setup.eval_batch_size=16
  setup.num_workers=3
  seed=1
  model.kd_input=True,False
  model.kd_target=True
)
python main.py -m "${overrides[@]}"

# Launch main.py with training=finetune and model=kd_lm on data=strategyqa
# for seed=2, using model.arch=t5-base together with model.aux_arch=t5-large.
# Two comma-separated values are given for both the learning rate
# (4E-4, 5E-4) and model.kd_input (True, False); model.kd_target is True.
# The checkpoint path is hard-coded. The shell strips the outer double
# quotes, so the inner single quotes reach main.py as part of the value.
# NOTE(review): LFTR-5121 is presumably the seed=2 run of the t5-large
# aux_lm command earlier in this file -- confirm before re-running.
overrides=(
  save_checkpoint=False
  logger.offline=False
  training=finetune
  training.ckpt_path="'LFTR-5121/checkpoints/epoch=8-step=728.ckpt'"
  training.io_mode="I-O"
  training.aux_io_mode="IreplacedR-O"
  data=strategyqa
  model=kd_lm
  model.arch=t5-base
  model.aux_arch=t5-large
  model.optimizer.lr=4E-4,5E-4
  model/scheduler=linear_with_warmup
  model.scheduler.warmup_updates=0.06
  setup.train_batch_size=16
  setup.accumulate_grad_batches=1
  setup.eff_train_batch_size=16
  setup.eval_batch_size=16
  setup.num_workers=3
  seed=2
  model.kd_input=True,False
  model.kd_target=True
)
python main.py -m "${overrides[@]}"