{
    "checkpoint_frequency": 1000,
    "checkpoint_to_directly_load_model": null,
    "delete_exist_dir": false,
    "early_stopping": true,
    "early_stopping_num_checkpoints_without_improvement": 5,
    "eval_batch_size": 16,
    "eval_template_idx": -2,
    "evaluate_type": "inference",
    "experiment_dir": "exp_out/merging/ia3-bigscience-T0_3B/tpa-es10_ia3_base_test",
    "experiment_name": "tpa-es10_ia3_base_test",
    "few_shot_random_seed": null,
    "function_to_merge_checkpoints": null,
    "gradient_accumulation_factor": 16,
    "inference_dataset": null,
    "inference_dataset_mixture": "T0_held_out",
    "lambda_init": 0.2,
    "lambda_type": "vector-shared",
    "learn_pretraining_lambda": false,
    "length_normalization": false,
    "lr": 0.0001,
    "max_datapoints_per_dataset": 500000,
    "max_datapoints_per_dataset_without_templates": null,
    "max_gen_len": 64,
    "max_seq_len": 512,
    "model_checkpoints": null,
    "model_lambda": null,
    "norm_to_clip_gradient": null,
    "num_batches": 10000,
    "num_val_samples": 32,
    "optimizer": "adamw",
    "peft_method": "ia3",
    "pretrained_lambda_type": "scalar-shared",
    "pretrained_model": "bigscience/T0_3B",
    "pretraining_init": 1,
    "project_name": "merging",
    "projection_loss": 0,
    "resume_checkpoint_filepath": null,
    "scheduler": null,
    "search_lambda": "none",
    "seed": 42,
    "should_eval_at_beginning": true,
    "should_eval_train": false,
    "should_eval_validation": true,
    "should_save_every_checkpoint": false,
    "should_save_most_recent_state": true,
    "should_save_to_gcp": false,
    "split": "test",
    "temperature": 1,
    "train_batch_size": 8,
    "train_dataset": null,
    "train_dataset_mixture": "T0_held_out",
    "train_template_idx": -2,
    "trainable_param_regex": null,
    "use_bfloat16_during_eval": true,
    "use_bfloat16_during_training": true,
    "warmup_ratio": 0.0,
    "weight_decay": 0.0,
    "world_size": null
}
