{
  "dataset": {
    "dataset": "ActivityNet",
    "feature_path": "sub_activitynet_v1-3.c3d.hdf5",
    "vocab_size": 8000,
    "word_dim": 300,
    "frame_dim": 500,
    "max_num_words": 20,
    "max_num_frames": 200,
    "target_stride": 1,
    "train_data": "data/activitynet/train.json",
    "test_data": "data/activitynet/test_trivial.json",
    "val_data": "data/activitynet/val.json",
    "vocab_path": "data/activitynet/glove.pkl"
  },
  "train": {
    "optimizer": {
      "lr": 4e-4,
      "weight_decay": 0,
      "warmup_updates": 400,
      "warmup_init_lr": 1e-7
    },
    "batch_size": 32,
    "max_num_epochs": 30,
    "model_saved_path": "checkpoints/ActivityNet/"
  },
  "model": {
    "name": "PCNet",
    "config": {
      "frames_input_size": 500,
      "words_input_size": 300,
      "hidden_size": 256,
      "use_negative": true,
      "num_props": 8,
      "sigma": 4,
      "sigma_neg": 3,
      "gamma": 0,
      "dropout": 0.1,
      "DualTransformer": {
        "d_model": 256,
        "num_heads": 4,
        "num_decoder_layers1": 3,
        "num_decoder_layers2": 3,
        "dropout": 0.1
      }
    }
  },
  "loss": {
    "margin_1": 0.1,
    "margin_2": 0.15,
    "lambda": 0.15,
    "alpha_1": 1,
    "alpha_2": 0.1,
    "inter_lambda": 0.13
  }
}