---
# Model selection, per-layer projection names and grouping settings.
# NOTE(review): the meaning of individual keys is inferred from their names;
# confirm against the code that loads this file.
model_args:
  # NOTE(review): model_type is 'llama2' while model_name points at a
  # llama-30b checkpoint - confirm this pairing is intended.
  model_type: 'llama2'
  model_name: 'jeffwan/llama-30b-hf'

  # Dotted names of the seven projection modules. The short prefix of each
  # key (k, q, v, o, up, down, gate) is what share_part / private_part
  # refer to below.
  k_name: 'self_attn.k_proj'
  q_name: 'self_attn.q_proj'
  v_name: 'self_attn.v_proj'
  o_name: 'self_attn.o_proj'
  up_name: 'mlp.up_proj'
  down_name: 'mlp.down_proj'
  gate_name: 'mlp.gate_proj'

  group_size: 2
  # The value 20 is also embedded in the output paths and run name used
  # elsewhere in this file ("share_llama-30b_20"); keep them in sync.
  compression_ratio: 20

  # stride is set equal to context_length here.
  context_length: 2048
  stride: 2048

  # Every projection prefix appears in exactly one of the two lists.
  share_part: ['v', 'k', 'q', 'up', 'gate']
  private_part: ['down', 'o']

# Calibration data settings.
# NOTE(review): key semantics are inferred from names; confirm with the loader.
calibration_args:
  dataset_name: 'wikitext'
  # build_calib is enabled; calib_path is the directory paired with it
  # (presumably where calibration data is written/read - TODO confirm).
  build_calib: true
  calib_path: './calib/llama-30b/wikitext/'
  # Explicit null: no cache directory is configured here.
  dataset_cache_dir: null
  calibration_size: 256
  calib_batch_size: 2

# Post-calibration update stage. Both switches are off in this config and
# the path is an empty string (not null).
after_calibration_update_args:
  update_calib_path: ''
  build_update_calib: false
  update: false


# Output locations for model checkpoints. Each save_* flag sits next to the
# path it is presumably paired with (TODO confirm against the consumer).
# In this config only the untrained model is saved.
model_saving:
  save_updated_model: false
  updated_model_path: './updated_model/share_llama-30b_20/wikitext'
  save_untrained_model: true
  untrained_model_path: './untrained_model/share_llama-30b_20/wikitext'

# LoRA fine-tuning settings.
# NOTE(review): lora_r / lora_alpha presumably map to the adapter rank and
# scaling factor of the LoRA library in use - confirm against the trainer.
lora_args:
  save_lora: true
  lora_r: 8
  lora_alpha: 32
  lora_output_dir: './lora/share_llama-30b_20/wikitext'
  lora_train_batch_size: 1
  # Keep the decimal point: YAML 1.1 loaders such as PyYAML resolve a bare
  # "1e-4" as a string, not a float.
  lora_learning_rate: 1.0e-4
  lora_train_epoch: 2
  lora_run_name: 'share_llama-30b_20'
