{
  "title": "Analyzing the Effectiveness of the Underlying Reasoning Tasks in Multi-hop Question Answering",
  "number_of_tables": 10,
  "classification_of_tables": {
    "0": 0,
    "1": 1,
    "2": 2,
    "3": 3,
    "4": 3,
    "5": 3,
    "6": 3,
    "7": 3,
    "8": 3,
    "9": 3
  },
  "selected_datasets": "2Wiki",
  "selected_table_index": 0,
  "metrics": "Exact Match (EM), F1 score",
  "selected_table_metrics": [
    "EM",
    "F1"
  ],
  "selected_table_core_results": {
    "EM": 79.68,
    "F1": 76.64
  },
  "selected_table_settings_model_size": "BigBird-base",
  "selected_table_settings_training_strategy": "Multi-task learning",
  "selected_table_settings_hyperparameter_selection": {
    "Learning rate": "3e-5",
    "Weight decay": "0.01",
    "Batch size": "32",
    "Gradient accumulation step": "8",
    "Dropout probability": "0.1"
  },
  "github": "https://github.com/Alab-NII/multi-hop-analysis"
}