{
    "model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp",
    "peft_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp-supervised",
    "bidirectional": true,
    "pooling_mode": "mean",
    "dataset_name": "E5",
    "dataset_file_path": "../data/echo-data",
    "remove_unused_columns": false,
    "learning_rate": 2e-4,
    "num_train_epochs": 1,
    "warmup_ratio": 0.1,
    "per_device_train_batch_size": 8,
    "per_device_eval_batch_size": 8,
    "gradient_accumulation_steps": 16,
    "do_train": true,
    "disable_tqdm": false,
    "max_seq_length": 1024,
    "overwrite_output_dir": true,
    "output_dir": "../saved_models/LLM2Vec_MetaLlama3_RARe",
    "logging_steps": 10,
    "save_steps": 200,
    "save_only_model": true,
    "stop_after_n_steps": 1000,
    "lora_r": 4,
    "gradient_checkpointing": true,
    "torch_dtype": "bfloat16",
    "seed": 42,
    "attn_implementation": "flash_attention_2",
    "retrieve_queries": true,
    "dataset_size": 100000,
    "n_ic_examples": 5
}