# Run identification. RUN_NAME matches MODEL.PROCESSOR.NAME ('FE') and
# ALGORITHM matches LOGGING.WANDB.GROUP ('dfs') elsewhere in this file.
RUN_NAME: 'FE'
ALGORITHM: 'dfs'
# Model configuration: processor selection, layer normalisation, step count
# and the GRU toggle.
MODEL:
  DECODER_USE_LAST_HIDDEN: true
  PROCESSOR_USE_LAST_HIDDEN: true
  PROCESSOR:
    NAME: 'FE'
    # A one-element list wrapping a mapping; this list-of-mapping shape is
    # preserved exactly, only written in block style.
    # NOTE(review): presumably forwarded as keyword arguments to the
    # processor constructor -- confirm against the config loader.
    KWARGS:
      - aggregation: 'max'
    PASS_BATCH: true
    LAYERNORM:
      ENABLE: true
      MODE: 'node'
  NUM_STEPS: 1
  GRU:
    ENABLE: false

# Training configuration: loss weights, epoch/batch limits, optimizer
# learning rate and the learning-rate scheduler.
TRAIN:
  LOSS:
    # Only the output term has a non-zero weight in this configuration.
    OUTPUT_LOSS_WEIGHT: 1.0
    HINT_LOSS_WEIGHT: 0.0
    HIDDEN_LOSS_WEIGHT: 0.0
  MAX_EPOCHS: 100
  BATCH_SIZE: 8

  ENABLE: true
  NUM_WORKERS: 4
  EARLY_STOPPING_PATIENCE: 30
  OPTIMIZER:
    LR: 0.0004239

  SCHEDULER:
    ENABLE: true
    NAME: 'ReduceLROnPlateau'
    # A one-element list wrapping a mapping; this list-of-mapping shape is
    # preserved exactly, only written in block style.
    # NOTE(review): presumably passed as keyword arguments to the scheduler
    # named above. If that is torch's ReduceLROnPlateau, `verbose` is
    # deprecated in recent PyTorch releases -- confirm against the installed
    # version before upgrading.
    PARAMS:
      - mode: 'min'
        factor: 0.1
        patience: 10
        verbose: true

# Test settings. BATCH_SIZE has the same value as TRAIN.BATCH_SIZE (8).
TEST:
  BATCH_SIZE: 8

# Logging settings for Weights & Biases (WANDB).
LOGGING:
  WANDB:
    # Same value as the top-level ALGORITHM key.
    GROUP: 'dfs'
    # NOTE(review): 'ENTITY' looks like a placeholder -- presumably it must
    # be replaced with a real W&B entity before logging; confirm.
    ENTITY: 'ENTITY'
