# Settings describing the language model used by the run.
model:
  # Short label for the model.
  name: 'gemma'
  # Model identifier; the key name suggests a Hugging Face Hub repo id.
  hugging_face_model_id: 'google/gemma-2b'
  type: 'decoder'
  # NOTE(review): presumably these two must match the checkpoint's
  # architecture (layer count and hidden size) - confirm against the model.
  num_layers: 18
  hidden_dim: 2048
  batch_size: 2

# Dataset selection and text pre-processing switches.
dataset:
  name: 'MothRadioHour'
  # Booleans are written in canonical lowercase form so that every YAML
  # loader (1.1 and 1.2) resolves them identically.
  # NOTE(review): judging by the key names, these toggle text clean-up
  # steps; the exact behaviour is defined by the consuming code.
  remove_format_chars: true
  remove_punc_spacing: true

# Attribution settings.
attribution:
  # Master switch for this section (canonical lowercase boolean).
  flag: true
  # NOTE(review): 'gxi' presumably selects the attribution method by name;
  # confirm the accepted values against the consuming code.
  method: 'gxi'
  # Layer indices to process. Alternative set kept for reference:
  # [5, 6, 12, 17]
  layers: [5, 6, 12]
  context_length: 640
  # NOTE(review): presumably percentage thresholds (all values are < 100);
  # confirm units against the consuming code.
  top_mass: [1, 2, 3, 5, 10, 20, 30, 40, 50, 60, 70, 80, 90, 95, 98]

# Experiment-level settings. Booleans use canonical lowercase form.
experiment:
  # Relative path; resolved against whatever the consuming code uses as
  # its base directory.
  output_root_dir: ./outputs

  num_delays: 4
  # Empty string by default.
  # NOTE(review): presumably filled in or overridden at run time - confirm.
  subject_idx: ''
  normalize_data_by_run: true
  apply_pca: false
  # NOTE(review): -1 looks like a sentinel while apply_pca is false; confirm
  # how the consuming code interprets it.
  num_red_components: -1
  num_folds: 11
  num_tr_trim: 5

  verbose: true
