# Training / experiment configuration.
# NOTE(review): the comments below are inferred from key names and values
# only; confirm semantics against the code that consumes this file.

optimizer: 'SGD'
# `${UL}` is a placeholder inside the dataset name; presumably substituted by
# the config loader or a templating step -- TODO confirm where UL is defined.
dataset: 'kuairec_${UL}'
num_sample: 5
# Two weight-decay values are supplied; how each entry is applied is not
# visible from this file -- TODO confirm with the consumer.
weight_decay:
  - 0.00005
  - 0.001
lr: 0.01
lr_sch: 'CosineAnnealingLR'
epochs: 120
batch_size: 32
batch_log_interval: 50
# Written without digit separators on purpose: `5_000_000` resolves to an
# integer only under YAML 1.1 resolvers; YAML 1.2 core-schema parsers read it
# as the string "5_000_000".
train_limit: 5000000
# NOTE(review): key is spelled `lamda` (not `lambda`); left unchanged because
# consumers presumably look up this exact key.
lamda: 0.9
experiment:
  name: 'full_bandit_feedback'
  n_exp: 5
  n_trials: 3
  feedback: 'bandit'
  # Explicit null: no regularizers are configured for this experiment.
  regularizers: null
  # Quoted so the value is unambiguously a string.
  labeled_portion: 'u0'
