# Top-level SYSTEM section: settings kept separate from the VIST section.
SYSTEM:
  # Verbosity name passed to the consumer's logger.
  # NOTE(review): presumably a Python logging level name; confirm in the loader.
  DEBUGGING_LEVEL: 'INFO'
  NUM_GPUS: 1
  NUM_WORKERS: 4
  # Relative value (no leading slash).
  # NOTE(review): presumably resolved against the launch directory; confirm.
  OUT_DIR: 'arel_hard_roberta_prefix'
  SEED: 123
# VIST section: dataset locations, data settings, model choice and training
# hyper-parameters. Keys are grouped by purpose; mapping order carries no
# meaning for the loader.
VIST:
  # --- Dataset locations ---------------------------------------------------
  # Absolute, site-specific paths; adjust when running on another machine.
  # NOTE(review): DII / DIS / SIS presumably name the VIST annotation tiers;
  # confirm against the data loader.
  DII_ROOT: /n/fs/nlp-xxxx/datasets/VIST/dii
  DIS_ROOT: /n/fs/nlp-xxxx/datasets/VIST/dis
  SIS_ROOT: /n/fs/nlp-xxxx/datasets/VIST/sis

  # One generated-stories file per split (train / val / test).
  GENERATED_STORIES_PATH_TRAIN: /n/fs/nlp-xxxx/datasets/VIST/preprocessed/arel/hard_gen_stories_with_prefix_train.json
  GENERATED_STORIES_PATH_VAL: /n/fs/nlp-xxxx/datasets/VIST/preprocessed/arel/hard_gen_stories_with_prefix_val.json
  GENERATED_STORIES_PATH_TEST: /n/fs/nlp-xxxx/datasets/VIST/preprocessed/arel/hard_gen_stories_with_prefix_test.json

  # One distractor file per split, given as relative paths. The directory
  # name embeds "seed-123", the same value as SYSTEM.SEED in this file.
  # NOTE(review): if the seed is changed, check whether these paths must
  # change with it.
  DISTRACTOR_PATH_TRAIN: configs/vist_distractor_ids/seed-123/train_hard_sampled_distractors.json
  DISTRACTOR_PATH_VAL: configs/vist_distractor_ids/seed-123/val_hard_sampled_distractors.json
  DISTRACTOR_PATH_TEST: configs/vist_distractor_ids/seed-123/test_hard_sampled_distractors.json

  # --- Data settings -------------------------------------------------------
  CAPTION_TYPE: stories
  # NOTE(review): unit (tokens vs. words) is not visible here; confirm.
  MAX_LEN_CAPTION: 20
  NUM_DISTRACTORS: 4
  BATCH_PER_GPU: 16

  # --- Overfit / debug mode ------------------------------------------------
  OVERFIT: false
  # NOTE(review): presumably only read when OVERFIT is true; confirm.
  DATASET_SAMPLE_OVERFIT: 10

  # --- Model ---------------------------------------------------------------
  MODEL_TYPE: ROBERTA
  # NOTE(review): looks like a pretrained-model identifier rather than a
  # filesystem path; confirm how the loader resolves it.
  MODEL_PATH: roberta-base
  DROPOUT: 0.2

  # --- Training ------------------------------------------------------------
  NUM_EPOCHS: 10
  # Keep the plain decimal form: YAML 1.1 loaders such as PyYAML read
  # exponent forms without a dot and signed exponent (e.g. 2e-5) as strings.
  LR: 0.00002
  # Written as an integer.
  # NOTE(review): if the consumer type-checks against a float default, this
  # may need to be 1.0; confirm.
  MARGIN: 1
  # NOTE(review): logging interval; unit (steps vs. batches) not visible here.
  LOG_EVERY: 20
  SAVE_EVERY_N_EPOCHS: 1