data:
  !include ../base_data_setting.yml
  
environment:
   dotenv_path: .env
  
model:

  # meta-llama/Llama-3.2-1B-Instruct
  # meta-llama/Llama-3.2-3B-Instruct
  # meta-llama/Llama-3.1-8B-Instruct
  model_name: meta-llama/Llama-3.1-8B-Instruct
  model_type: llama3.1

  # "llama-3.1" is similar to llama-3.2
  # See https://docs.unsloth.ai/basics/chat-templates
  # chatml: Supports zephyr, chatml, mistral, llama, alpaca, vicuna, vicuna_old, unsloth
  chat_template: llama-3.1

  max_seq_length: 2048
  load_in_4bit: false


train:
  data_synthetic: !include ../gpt4o-DSynt_data_setting.yml

  plan_type: latent

  epoch: 4
  # 2e-4
  learning_rate: 0.0002 
  per_device_train_batch_size: 4
  gradient_accumulation_steps: 4
  weight_decay: 0.01
  lr_scheduler: linear
  
  lora:
    # Rank parameter for LoRA. The smaller this value, the fewer parameters will be modified.
    # Choose any number > 0 ! Suggested 8, 16, 32, 64, 128
    r: 16
    target_modules:
      - q_proj
      - k_proj
      - v_proj
      - o_proj
      - gate_proj
      - up_proj
      - down_proj
    # Alpha parameter for LoRA. This value determines the strength of the applied LoRA.
    lora_alpha: 16
    # Supports any, but = 0 is optimized
    lora_dropout: 0
    # Supports any, but = "none" is optimized
    bias: none
    # Whether to use gradient checkpointing to improve memory efficiency
    # True or "unsloth" for very long context
    use_gradient_checkpointing: unsloth
    # Seed value for random number generation
    random_state: 3407
    use_rslora: false
    loftq_config: null

logging:
  log_steps: 1
  # path where to save, empty for no saving

  checkpoint_path: experiments/checkpoints
  result_path: experiments/results
  logging_path: experiments/loggings
  visualization_path: experiments/visualizations


evaluation:
  per_device_eval_batch_size: 4

