{
      "mode": "fewshot",
      "output_dir": "proj_1",
      "device": "cuda",
      "resume_from_checkpoint": "checkpoints/v4:llama1b_inst_all-checkpoint-hypernet-step97952.pt",
      "resume_from_checkpoint_reset_steps": false,
      "save_state": true,
      "train_batch_size": 8,
      "subset_batch_size": 128,
      "eval_batch_size": 8,
      "learning_rate": 1e-4,
      "max_grad_norm": 1.0,
      "weight_decay": 5e-6,
      "adam_beta1": 0.9,
      "adam_beta2": 0.999,
      "adam_epsilon": 1e-8,
      "epochs": 5,
      "warmup_steps": 1000,
      "logging_steps": 64,
      "save_steps_l": [1024, 2048, 4096, 8192, 16384],
      "eval_steps_l": [1024, 2048, 4096, 8192, 16384],
      "generate_steps_l": [1024, 2048, 4096, 8192, 16384],
      "generate_steps": null,
      "eval_steps": null,
      "save_steps": null,
      "eval_at_step_zero": false,
      "generate_at_step_zero": false,
      "gradient_accumulation_steps": 8,
      "pad_to_multiple_of": 8,
      "debug": false,
      "augment_emb_space": true,
      "feed_txt_embs": true,
      "menc_names_or_paths": [
            "timm/ViT-L-16-SigLIP2-384",
            "OpenGVLab/ViCLIP-B-16",
            "Cacophony"
      ],
      "fewshot_menc_names_or_paths": [
            "acharkq/MolCA"
      ],
      "fewshot_load_extracted_features": [true],
      "mm_dim": 768,
      "load_extracted_features": [true, true, true],
      "mm_dtype": "float32",
      "lm_name_or_path": "meta-llama/Llama-3.2-1B-Instruct",
      "lm_dtype": "bfloat16",
      "dataset_names_or_paths": ["sharegpt4v", "sharegpt4video", "clothodetail"],
      "fewshot_dataset_names_or_paths": ["chebi20"],
      "fewshot_dataset_sizes": ["full"],
      "fewshot_epochs": [10],
      "proj_name_or_path": "checkpoints/v1:llama1b_inst_all_extracted-checkpoint-projector-best.pt",
      "proj_arch": "mlp",
      "proj_act": "quick_gelu",
      "proj_n_layers": 2,
      "hn_name_or_path": "hypnet_1",
      "hn_arch": "attention",
      "hn_hypnet_dim": 768,
      "hn_rank": 32,
      "hn_alpha": 32,
      "hn_predict_bias": true,
      "hn_principled_init": false,
      "hn_n_proj_layers": null,
      "hn_use_pos_encs": true,
      "finetune_generated_projector": true
}
