# Optimizer hyperparameters and step counts.
optimizer:
  # Same value as 0.00005, written in the exponent form used by adam_eps.
  learning_rate: 5.0e-05
  adam_betas: [0.9, 0.999]
  adam_eps: 1.0e-08
  adam_weight_decay: 0.01
  warmup_steps: 2000
  max_steps: 450000


# Language-model selection and sequence-length settings.
LLM:
  cache_dir: ./huggingfaceModel

  # Exactly ONE `model_name` may be active at a time.
  # Several entries used to be uncommented together; duplicate mapping keys
  # are invalid YAML: strict loaders reject the file and lenient loaders
  # silently keep only the last occurrence. The entry that was last (and
  # therefore effective under last-wins loaders) is the one kept active here.
  # To switch models, comment out the active line and uncomment one below.
  # The "bsize N" notes are presumably the batch size used with that model.
  model_name: deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B

  # Alternatives that were previously left uncommented:
  # model_name: meta-llama/Llama-3.1-8B  # bsize 10
  # model_name: google/gemma-2-9b  # bsize 10
  # model_name: google/gemma-2-9b-it  # bsize 10
  # model_name: bigscience/bloom-7b1  # bsize 8
  # model_name: nvidia/Llama-3.1-Nemotron-70B-Instruct
  # model_name: google/gemma-2-27b-it
  # model_name: meta-llama/Llama-3.2-11B-Vision
  # model_name: deepseek-ai/DeepSeek-R1-Distill-Llama-8B

  # Other alternatives:
  # model_name: 'chaoyi-wu/PMC_LLAMA_7B'  # bsize 16
  # model_name: 'meta-llama/Meta-Llama-3-8B'  # bsize 10
  # model_name: 'openai-community/gpt2-large'  # bsize 36
  # model_name: 'EleutherAI/gpt-neo-2.7B'
  # model_name: 'epfl-llm/meditron-70b'
  # model_name: distilbert/distilgpt2  # bsize 160
  # model_name: google/gemma-2b  # bsize 32
  # model_name: google/gemma-2-2b-it  # bsize 24
  # model_name: meta-llama/Llama-2-7b-hf  # bsize 16

  # Medical-domain alternatives:
  # model_name: 'axiong/PMC_LLaMA_13B'
  # model_name: 'chaoyi-wu/MedLLaMA_13B'
  # model_name: 'ruslanmv/Medical-Llama3-8B'
  # model_name: 'TsinghuaC3I/Llama-3-8B-UltraMedical'
  # model_name: 'aaditya/Llama3-OpenBioLLM-8B'
  # model_name: 'ruslanmv/Medical-Llama3-v2'
  # model_name: 'instruction-pretrain/medicine-Llama3-8B'
  # model_name: 'sethuiyer/Medichat-Llama3-8B'

  seq_length: 256


# Per-dataset file locations. All paths are relative (they start with './').

# path_vqa: image directory and QA directory.
path_vqa:
  image_main_path: './Path-VQA/pvqa/images'
  qa_main_path: './Path-VQA/pvqa/qas/'

# pmc_oa: sub-figure image directory and the directory holding the JSON files.
# NOTE(review): both paths point under ./BreastCancerData rather than a
# PMC-OA directory; confirm this is intended.
pmc_oa:
  image_main_path: './BreastCancerData/MultiModal/caption_T060_filtered_top4_sep_v0_subfigures/'
  json_files_main_path: './BreastCancerData/MultiModal/'

# pmc_vqa: image root plus train/validation CSV files.
# NOTE(review): valid_csv_path points at test_combined.csv; confirm that
# using the test file for validation is intended.
pmc_vqa:
  image_main_path: './PMC-VQA/'
  train_csv_path: './PMC-VQA/train_combined.csv'
  valid_csv_path: './PMC-VQA/test_combined.csv'

# rad_vqa: dataset root and image folder (the folder name contains spaces,
# so the value must stay quoted or otherwise intact).
rad_vqa:
  main_path: './VQA-RAD/'
  image_main_path: './VQA-RAD/VQA_RAD Image Folder'

# slake_vqa: image directory plus train/validate/test JSON files.
slake_vqa:
  image_main_path: './Slake-VQA/imgs/'
  train_json_path: './Slake-VQA/train.json'
  valid_json_path: './Slake-VQA/validate.json'
  test_json_path: './Slake-VQA/test.json'

# omnimed_vqa: image root plus train/valid JSON files.
omnimed_vqa:
  image_main_path: './OmniMedVQA/OmniMedVQA/'
  train_json_path: './OmniMedVQA/train.json'
  valid_json_path: './OmniMedVQA/valid.json'




# Datasets enabled for this run; uncomment an entry to enable it.
# Keep at least one entry active: a key with no items loads as null, not as
# an empty list (write `dataset_list: []` if an empty list is really wanted).
# NOTE(review): entries are hyphenated ('rad-vqa') while the path sections in
# this file use underscores (rad_vqa); confirm the consumer maps between them.
dataset_list:
  # - 'path-vqa'
  - 'rad-vqa'
  # - 'slake-vqa'
  # - 'pmc-oa'
  # - 'pmc-vqa'
  # - 'omnimed-vqa'

# Top-level run settings, grouped by purpose. Values are unchanged; only the
# order, spacing and boolean spelling were normalised.

# Devices and data loading
num_devices: 1
num_workers: 8
prefetch_factor: 3
image_size: [224, 224]

# Model components
# vision_module: Vit512
vision_module: BiomedCLIP
img_token_num: 2
lora_rank: 8

# Training loop
max_epochs: 35
batch_size: 128
accumulation: 1

# Checkpoints and experiment tracking
checkpoint_dirpath: './checkpoints/LLM-MED/'
# Empty string; presumably means "no checkpoint to load" (confirm in consumer).
ckpt_path: ''
wandb_folder_path: ./WANDB
project: 'LLMED-V1'
experiment_name: 'All'

# Inference
is_inference: false
n_inference_lim: 500

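# Other vision_module options (key spelled in lowercase to match the active
# `vision_module` entry, so uncommenting one does not create a different key):
# vision_module: 'UNI'
# vision_module: 'CLIP'
# vision_module: 'Scratch'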

###### Things to check before launching a run
# - experiment name
# - model name
# - pretrained checkpoint in train.py
# - rad-vqa dataset: ChatGPT setting
# - rad-vqa dataset: question-guess setting


