defaults: # loads default configs
  - task: nlp/conversation
  - optimizer: sgd
  - scheduler: reduce_lr_on_plateau
  - training: default
  - trainer: default
  - trainer/logger: wandb
  - hydra: output/custom
  - override dataset: nlp/conversation/my_daily_dialog

backbone:
  pretrained_model_name_or_path: facebook/blenderbot-400M-distill

dataset:
  cfg:
    history_delimiter: '  '
    history_size: 3
    hierarchical: False
    eval_batch_size: 12

task:
  _target_: lightning_transformers.task.nlp.conversation.ConversationTransformer
  cfg:
    compute_generate_metrics: True
    task_name: conversation_ct
    scheduler_monitor: val_loss
    scheduler_mode: min
    no_repeat_ngram_size: 3 # 3 by default
    encoder_no_repeat_ngram_size: 3 # 3 by default
    min_length: 20 # 20 by default
    max_length: 30
    num_beams: 10 # 10 by default
    history_delimiter: ${dataset.cfg.history_delimiter}
    history_size: ${dataset.cfg.history_size}

trainer:
  gpus: 1
  val_check_interval: 1000
  max_steps: 50000
  max_epochs: 100
  gradient_clip_val: 0.1
  resume_from_checkpoint: ${trainer.default_root_dir}/last.ckpt
  default_root_dir: ${oc.env:HOME}/storage/trained/lit/${task.cfg.task_name}/${backbone.pretrained_model_name_or_path}_${dataset.cfg.pretrained_dataset_name}/${experiment_name}
  logger:
    project: ct

training:
  lr: 0.05
  batch_size: 6

optimizer:
  weight_decay: 0

experiment_name: ${now:%Y-%m-%d}_${now:%H-%M-%S-%f}
log: True
ignore_warnings: True # todo: check warnings before release
seed: 0
stage: train # choose from train, test, (predict, interact, to be added)
finetune_ckpt: null
