# Run-level settings (seed, hardware, output, logging).
SYSTEM:
  # Random seed for the run.
  SEED: 123

  # Hardware / data-loading resources.
  NUM_GPUS: 1
  # presumably the number of data-loader worker processes; confirm in the consumer
  NUM_WORKERS: 4

  # Output directory name for this experiment and the log verbosity.
  OUT_DIR: no_finetuned_hard_roberta
  DEBUGGING_LEVEL: INFO
# Dataset, model and training settings for the VIST experiment.
VIST:
  # --- Dataset roots (absolute paths under the VIST dataset directory) ---
  DII_ROOT: /n/fs/nlp-xxxx/datasets/VIST/dii
  DIS_ROOT: /n/fs/nlp-xxxx/datasets/VIST/dis
  SIS_ROOT: /n/fs/nlp-xxxx/datasets/VIST/sis

  # --- Pre-generated captions, one JSON file per split ---
  # All three come from the "no_finetuning" preprocessing output directory.
  GENERATED_STORIES_PATH_TRAIN: /n/fs/nlp-xxxx/datasets/VIST/preprocessed/no_finetuning/train_hard_gen_caption.json
  GENERATED_STORIES_PATH_VAL: /n/fs/nlp-xxxx/datasets/VIST/preprocessed/no_finetuning/val_hard_gen_caption.json
  GENERATED_STORIES_PATH_TEST: /n/fs/nlp-xxxx/datasets/VIST/preprocessed/no_finetuning/test_hard_gen_caption.json

  # --- Sampled distractor ids, one JSON file per split ---
  # Relative paths (no leading slash). The "seed-123" directory matches
  # SYSTEM.SEED: 123; NOTE(review): presumably these must be changed together,
  # confirm with whoever generates the distractor files.
  DISTRACTOR_PATH_TRAIN: configs/vist_distractor_ids/seed-123/train_hard_sampled_distractors.json
  DISTRACTOR_PATH_VAL: configs/vist_distractor_ids/seed-123/val_hard_sampled_distractors.json
  DISTRACTOR_PATH_TEST: configs/vist_distractor_ids/seed-123/test_hard_sampled_distractors.json

  # --- Data / sampling ---
  CAPTION_TYPE: stories
  MAX_LEN_CAPTION: 20
  NUM_DISTRACTORS: 4
  # Overfitting mode is disabled here.
  # NOTE(review): DATASET_SAMPLE_OVERFIT is presumably only read when OVERFIT
  # is true; verify in the data-loading code.
  OVERFIT: false
  DATASET_SAMPLE_OVERFIT: 10

  # --- Model ---
  MODEL_TYPE: ROBERTA
  # NOTE(review): looks like a pretrained-model identifier rather than a local
  # filesystem path; confirm how the consumer resolves it.
  MODEL_PATH: roberta-base
  DROPOUT: 0.2

  # --- Optimisation / training schedule ---
  BATCH_PER_GPU: 16
  NUM_EPOCHS: 20
  # Keep plain decimal notation: some YAML 1.1 loaders (e.g. PyYAML) resolve
  # dot-less exponent forms such as 2e-5 as strings instead of floats.
  LR: 0.00002
  MARGIN: 1

  # --- Logging / checkpointing ---
  # NOTE(review): unit of LOG_EVERY (steps vs. batches) is not visible here.
  LOG_EVERY: 20
  SAVE_EVERY_N_EPOCHS: 1