#@package _global_

# Hydra defaults list: pulls in the glue-cola experiment config, referenced
# by an absolute path (leading "/") within the config search path.
defaults:
  - /experiment/glue/glue-cola.yaml

# Callback entries declared by this config. Each `_target_` is a dotted
# import path to the class to build (Hydra instantiate convention).
callbacks:
  # NOTE(review): presumably tracks the learned widths during training;
  # confirm against src.callbacks.width_monitor.
  width_monitor:
    _target_: src.callbacks.width_monitor.WidthMonitor
  # NOTE(review): presumably reports the parameter count of the Gaudi BERT
  # variant; confirm against src.callbacks.flop_count.
  bert_num_params:
    _target_: src.callbacks.flop_count.NumParamsBertGaudi



# Task settings: selects the "gaudi" layer type and provides its
# hyperparameters under `gaudi_params`.
task:
  budget_in_ratio: 0.5
  layer_type: "gaudi"
  scale_gaudi_lr: true
  gaudi_params:
    rank_per_component: 1
    total_rank_ratio: 1
    # Neither widths nor locations are held fixed in this configuration.
    fixed_width: false
    fixed_location: false
    min_widths: [0.0, 0.0]
    max_widths: [1.0, 1.0]
    width_init: "splr"
    compute_mode: "dense"
    # NOTE(review): 'linspace' was left here as a commented-out alternative
    # to the numeric initial value; confirm which values are accepted.
    location_init: 0.0
    width_learning_rate: 0.0001
    width_weight_decay: 0.0
    # Relative interpolation: resolves to the sibling `width_learning_rate`,
    # so both learning rates stay in sync unless this key is overridden.
    location_learning_rate: ${.width_learning_rate}
    beta: 2.0
    adam_betas: [0.0, 0.999]
    on_freq_domain: false
    scaled_gaussian: false
    val_with_gaussian: true
    kernel: "dirichlet"
