# Model settings.
model:
  name: 'llama3.2-1B'
  # The value starts with "./", so it is presumably a local checkpoint
  # directory rather than a Hub repository id — TODO confirm with the loader.
  hugging_face_model_id: './.llama3.2-1B'
  type: 'decoder'
  # NOTE(review): num_layers and hidden_dim presumably mirror the checkpoint's
  # own architecture config; verify they stay in sync with it.
  num_layers: 16
  hidden_dim: 2048
  batch_size: 2

# Dataset selection and text clean-up switches.
dataset:
  name: 'MothRadioHour'
  # NOTE(review): judging by the key names these toggle removal of formatting
  # characters and of spacing around punctuation — confirm against the
  # preprocessing code.
  remove_format_chars: true
  remove_punc_spacing: true

# Attribution settings.
attribution:
  # NOTE(review): presumably the on/off switch for the attribution step —
  # confirm against the consumer.
  flag: true
  method: 'gxi'
  # Alternative selection kept for reference: [4, 9, 12, 15]
  # NOTE(review): presumably indices into the model's layers — confirm
  # whether they are 0- or 1-based.
  layers: [4, 9, 12]
  context_length: 640
  # Alternative grid kept for reference (adds the low-end values 2 and 3):
  # [1, 2, 3, 5, 10, 20, 30, 40, 50, 60, 70, 80, 90, 95, 98]
  top_mass: [1, 5, 10, 20, 30, 40, 50, 60, 70, 80, 90, 95, 98]

# Experiment settings.
experiment:
  output_root_dir: ./outputs

  num_delays: 4
  # Deliberately an empty string, not null.
  # NOTE(review): presumably means "no specific subject selected" — confirm
  # how the consumer treats ''.
  subject_idx: ''
  normalize_data_by_run: true
  apply_pca: false
  # NOTE(review): -1 looks like a sentinel value (and apply_pca is false
  # here) — confirm its meaning with the code that reads it.
  num_red_components: -1
  num_folds: 11
  num_tr_trim: 5

  verbose: true
