# config.yml
# Run-level settings: run identity, seeding, output location and schedule.
experiment:
  # The trailing backslash was dropped: in a plain scalar it is a literal
  # character and would have been part of the trial name.
  trial_name: E2E_experiment
  random_seed: 110
  # NOTE(review): presumably the directory checkpoints are written to —
  # confirm against the training script.
  work_dir: ./trained_models/GPT2_M/e2e/AdamW
  # NOTE(review): unit (steps vs. epochs) is not stated here — confirm.
  save_interval: 1000
  max_epoch: 5
  platform: local
  model_card: gpt2.md

# Dataset locations and batching parameters.
data:
  # Paths are quoted so they are always loaded as literal strings.
  train_data: './data/e2e/train.jsonl'
  valid_data: './data/e2e/valid.jsonl'
  # Separate batch sizes for the training and validation splits.
  train_batch_size: 8
  valid_batch_size: 4
  # NOTE(review): presumably the maximum sequence length in tokens — confirm.
  seq_len: 512

# Optimizer and learning-rate schedule settings.
optimization:
  opt: adamw
  # Written with an explicit decimal point: YAML 1.1 loaders (e.g. PyYAML)
  # resolve a bare `1e-2` as the string "1e-2", not as a float.
  # NOTE(review): 1e-2 looks high for AdamW fine-tuning — confirm it is intended.
  lr: 1.0e-2
  weight_decay: 0.01
  correct_bias: true
  scheduler: linear
  # NOTE(review): presumably counted in optimizer steps — confirm.
  warmup_step: 500
  # NOTE(review): presumably the number of gradient-accumulation steps — confirm.
  grad_acc: 1
  label_smooth: 0.1

# Settings grouped under the `adamw` key.
# NOTE(review): presumably only read when `optimization.opt` is `adamw` —
# confirm against the consumer.
adamw:
  # Only beta2 is set in this section; no beta1 key is present here.
  adam_beta2: 0.999

# Settings grouped under the `lora` key; `enable` is a boolean switch.
lora:
  enable: true
  # NOTE(review): presumably the rank of the low-rank adapter matrices — confirm.
  lora_dim: 4
  # NOTE(review): presumably the LoRA scaling numerator (alpha / dim) — confirm.
  lora_alpha: 32
  lora_dropout: 0.1

# Initialisation settings: starting checkpoint and the `clip` value.
init:
  # Path is quoted so it is always loaded as a literal string.
  init_checkpoint: './pretrained_checkpoints/gpt2-medium-pytorch_model.bin'
  # NOTE(review): presumably a gradient-clipping threshold where 0.0 disables
  # clipping — confirm against the training script.
  clip: 0.0
