---
# Hyperparameter sweep definition.
# NOTE(review): the layout (program / method / metric / parameters) looks like
# a Weights & Biases sweep config — confirm against the tool that loads it.
name: REDDIT-BINARY-fix-mean-that-include-zeros

# Script the sweep runs, and the search strategy used to pick each trial.
program: main.py
method: bayes

# Objective for the search: the logged value `name`, optimized towards `goal`.
metric:
  name: summary/temporal/final_acc
  goal: maximize
  impute: latest
parameters:
  # --- Fixed settings: a single `value`, identical for every trial ---
  dataset:
    value: REDDITBINARY
  device:
    value: 0
  special_pooling_type:
    value: temporal

  # --- Searched settings: each trial picks one entry from `values` ---
  batch_size:
    values:
      - 4
      - 8
      - 16
  hidden_dim:
    values:
      - 8
      - 16
      - 32
      - 64
  lr:
    values:
      - 0.01
      - 0.02
      - 0.005
      - 0.0001
  mha_dropout:
    values:
      - 0.1
      - 0.2
      - 0.5
  num_head:
    values:
      - 1
      - 4

  # The on/off switches below are quoted on purpose so they stay strings
  # rather than YAML booleans.
  # NOTE(review): presumably main.py parses the literal text 'true'/'false' —
  # confirm before converting these to real booleans.
  attn_mask_dropout:
    values:
      - 'false'
      - 'true'
  use_fc:
    values:
      - 'true'
      - 'false'
  add_zero_attn:
    values:
      - 'true'
      - 'false'
  weight_decay:
    values:
      - 0.0
      - 0.001
      - 0.01
  use_layer_norm:
    values:
      - 'true'
      - 'false'
  skip_connection:
    values:
      - 'true'
      - 'false'
  alpha_type:
    values:
      - 'learnable'
      - 'fixed'
      - 'never_negative_gradient'