{
  "general_multi_llama_3_1_8b_4bits_r4": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/general_multi.jsonl",
    "lora_r": 4,
    "quant_bits": 4,
    "learning_rate": 0.0001,
    "num_epochs": 4,
    "batch_size": 8,
    "gradient_accumulation_steps": 2
  },
  "general_multi_llama_3_1_8b_8bits_r8": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/general_multi.jsonl",
    "lora_r": 8,
    "quant_bits": 8,
    "learning_rate": 0.0001,
    "num_epochs": 4,
    "batch_size": 8,
    "gradient_accumulation_steps": 2
  },
  "general_multi_llama_3_1_8b_8bits_r8_dora": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/general_multi.jsonl",
    "lora_r": 8,
    "quant_bits": 8,
    "learning_rate": 0.0001,
    "num_epochs": 4,
    "batch_size": 8,
    "gradient_accumulation_steps": 2,
    "peft_use_dora": true
  },
  "general_multi_llama_3_1_8b_8bits_r8_rslora": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/general_multi.jsonl",
    "lora_r": 8,
    "quant_bits": 8,
    "learning_rate": 0.0001,
    "num_epochs": 4,
    "batch_size": 8,
    "gradient_accumulation_steps": 2,
    "peft_use_rslora": true
  },
  "reporting_multi_llama_3_1_8b_4bits_r4": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/reporting_multi.jsonl",
    "lora_r": 4,
    "quant_bits": 4,
    "learning_rate": 0.0001,
    "num_epochs": 1,
    "batch_size": 1,
    "gradient_accumulation_steps": 8
  },
  "reporting_multi_llama_3_1_8b_8bits_r8": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/reporting_multi.jsonl",
    "lora_r": 8,
    "quant_bits": 8,
    "learning_rate": 0.0001,
    "num_epochs": 1,
    "batch_size": 1,
    "gradient_accumulation_steps": 8
  },
  "reporting_multi_llama_3_1_8b_8bits_r8_dora": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/reporting_multi.jsonl",
    "lora_r": 8,
    "quant_bits": 8,
    "learning_rate": 0.0001,
    "num_epochs": 1,
    "batch_size": 1,
    "gradient_accumulation_steps": 8,
    "peft_use_dora": true
  },
  "reporting_multi_llama_3_1_8b_8bits_r8_rslora": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/reporting_multi.jsonl",
    "lora_r": 8,
    "quant_bits": 8,
    "learning_rate": 0.0001,
    "num_epochs": 1,
    "batch_size": 1,
    "gradient_accumulation_steps": 8,
    "peft_use_rslora": true
  },
  "analysis_multi_llama_3_1_8b_4bits_r4": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/analysis_multi.jsonl",
    "lora_r": 4,
    "quant_bits": 4,
    "learning_rate": 0.0001,
    "num_epochs": 1,
    "batch_size": 1,
    "gradient_accumulation_steps": 2
  },
  "analysis_multi_llama_3_1_8b_8bits_r8": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/analysis_multi.jsonl",
    "lora_r": 8,
    "quant_bits": 8,
    "learning_rate": 0.0001,
    "num_epochs": 1,
    "batch_size": 1,
    "gradient_accumulation_steps": 2
  },
  "analysis_multi_llama_3_1_8b_8bits_r8_dora": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/analysis_multi.jsonl",
    "lora_r": 8,
    "quant_bits": 8,
    "learning_rate": 0.0001,
    "num_epochs": 1,
    "batch_size": 1,
    "gradient_accumulation_steps": 2,
    "peft_use_dora": true
  },
  "analysis_multi_llama_3_1_8b_8bits_r8_rslora": {
    "base_model": "meta-llama/Llama-3.1-8B-Instruct",
    "dataset_path": "../data/train/multi/analysis_multi.jsonl",
    "lora_r": 8,
    "quant_bits": 8,
    "learning_rate": 0.0001,
    "num_epochs": 1,
    "batch_size": 1,
    "gradient_accumulation_steps": 2,
    "peft_use_rslora": true
  }
}
