# Random seed; presumably used to make runs reproducible — confirm where the
# training code applies it.
seed: 555
# Boolean switch; presumably enables Weights & Biases logging configured by the
# top-level `wandb` section of this file — verify against the training script.
use_wandb: true

# Compression settings.
# NOTE(review): keys in this section mix kebab-case with capitals
# (`forward-EF`) and snake_case (`layer_idx`). They are left untouched because
# the consuming code presumably looks them up by these exact names.
compression_config:
  # Presumably the number of pipeline stages the model is split into — confirm.
  num_stages: 2
  # Single compression entry.
  # NOTE(review): the key says "12" while layer_idx is 11 — presumably a
  # zero-based index for the 12th layer; confirm this is not an off-by-one.
  layer12:
    layer_idx: 11  # see the 11 vs. "layer12" note above
    # `forward*` keys: compressor name, EF switch, EF method and parameters,
    # presumably applied in the forward pass — confirm.
    forward: topk
    # EF presumably stands for error feedback; set to false here.
    forward-EF: false
    # Presumably only consulted when forward-EF is true — verify.
    forward-EF-method: EF21
    forward-params:
      # Presumably the fraction of entries kept by top-k — TODO confirm that
      # this is a ratio and not an absolute count.
      topk: 0.5
    # `backward*` keys: carry the same values as the `forward*` keys above.
    backward: topk
    backward-EF: false
    # Presumably only consulted when backward-EF is true — verify.
    backward-EF-method: EF21
    backward-params:
      # Same value as forward-params.topk.
      topk: 0.5

# Training run settings.
training:
  learning_rate: 0.00005  # i.e. 5e-5
  # Model identifier; how it maps to actual weights is decided by the
  # consuming code, which is not visible here.
  model: llama2
  # Dataset name and configuration; presumably passed to a dataset loader
  # (e.g. Hugging Face `datasets`) — confirm.
  dataset: wikitext
  dataset_config_name: wikitext-2-v1
  epochs: 1
  batch_size: 16
  # Presumably the sequence length in tokens per training example — confirm.
  block_size: 256
  gradient_checkpointing: false
  aq_sgd: false  # presumably toggles the AQ-SGD scheme — confirm
  lazy_sampling: false
  # NOTE(review): presumably ignored while lazy_sampling is false — verify.
  lazy_sampling_params:
    schedule: constant
    # Presumably a probability used by the schedule above — TODO confirm.
    p_t: 0.5


# NOTE(review): presumably the number of micro-batches each batch is split
# into — confirm against the consuming code.
micronum: 4
# Weights & Biases settings; presumably only used when `use_wandb` is true.
wandb:
  # NOTE(review): the trailing `gpt2-compression` comment looks like a
  # leftover alternative project name — confirm or remove.
  project: llama2-pipeline  # gpt2-compression
  # NOTE(review): the run name says "lazy" while training.lazy_sampling is
  # false — confirm the name still describes this run.
  name: lazy-test

# Hard-coded absolute path; what is written there is decided by the consuming
# code. NOTE(review): machine-specific, and the directory name mentions "c4"
# while training.dataset is wikitext — confirm this is the intended target.
output_dir: '/home/1/clapping_for_c4'