# Fine-tune BAAI/bge-m3 on data/embedding_data_minedHN.jsonl with the
# FlagEmbedding fine-tune module, launching 4 processes on this node.
# Checkpoints are written to data/bge-m3-custom.
#
# --logging_steps was previously passed twice (10, then 100). Only one value
# can take effect, so the redundant flag is dropped and 100 is kept —
# presumably the later occurrence was the one honored; TODO confirm that 100
# is the intended logging interval.
# NOTE(review): `--normlized` looks misspelled but presumably matches the
# option name defined by the FlagEmbedding module — verify before renaming.
torchrun --nproc_per_node 4 \
  -m FlagEmbedding.baai_general_embedding.finetune.run \
  --output_dir data/bge-m3-custom \
  --model_name_or_path BAAI/bge-m3 \
  --train_data data/embedding_data_minedHN.jsonl \
  --learning_rate 1e-5 \
  --fp16 \
  --num_train_epochs 5 \
  --per_device_train_batch_size 16 \
  --dataloader_drop_last True \
  --normlized True \
  --temperature 0.02 \
  --query_max_len 800 \
  --passage_max_len 800 \
  --train_group_size 4 \
  --negatives_cross_device \
  --logging_steps 100 \
  --gradient_accumulation_steps 4 \
  --save_total_limit 1 \
  --query_instruction_for_retrieval ""



# Fine-tune croissantllm/CroissantLLMBase on data/embedding_data_minedHN.jsonl
# with the FlagEmbedding fine-tune module, as a single-process run.
# Output is written to data/sentence_croissant_alpha_v0.3.
# Options are grouped several per line; the argument order is unchanged.
torchrun --nproc_per_node 1 -m FlagEmbedding.baai_general_embedding.finetune.run \
  --output_dir data/sentence_croissant_alpha_v0.3 \
  --model_name_or_path croissantllm/CroissantLLMBase \
  --train_data data/embedding_data_minedHN.jsonl \
  --learning_rate 1e-5 --fp16 --num_train_epochs 1 \
  --per_device_train_batch_size 8 --dataloader_drop_last True \
  --normlized True --temperature 0.02 \
  --query_max_len 800 --passage_max_len 800 \
  --train_group_size 2 --negatives_cross_device \
  --logging_steps 100 --gradient_accumulation_steps 4 \
  --query_instruction_for_retrieval ""



# Note: BAAI/bge-m3 is the model to use for mining negatives.