{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "class config:\n",
    "    data = 'Cora' #choices=[\"Cora\", \"Citeseer\", \"Pubmed\", \"Coauthor-CS\"]\n",
    "    model = 'GAT' #choices=[\"GCN\", \"GAT\", \"APPNP\", \"DAGNN\", \"TreeLSTM\", \"GTCN\", \"GTAN\", \"GTCN2\"]\n",
    "    n_in = 0\n",
    "    n_hid = 64\n",
    "    n_out = 0\n",
    "    num_heads = 1\n",
    "    num_out_heads = 1\n",
    "    device = 'cpu'\n",
    "    dropout = 0.8\n",
    "    dropout2 = 0.8\n",
    "    learning_rate = 0.01\n",
    "    weight_decay = 5e-4\n",
    "    patience = 200\n",
    "    num_iter = 1000\n",
    "    num_test = 30\n",
    "    hop = 2\n",
    "    alpha = 0.1 # used by APPNP only\n",
    "    random_label_split = False\n",
    "    num_train = 20 # for random label split only\n",
    "    num_val = 30 # for random label split only\n",
    "    data_load = True # load the saved label split to rerun the test (for reproduce purpose)\n",
    "    test_id = 1 # number of the test, only used to record the ith number of the random label split (for reproduce purpose)\n",
    "    filter_pct = 0.1 # remove the top and bottom filer_pct points before obtaining statistics of test accuracy\n",
    "    log = False # whether to show the training log or not\n",
    "    eval_metric = 'f1-macro' # evaluation metrics, choices=[\"acc\", \"f1-macro\", \"f1-micro\"]\n",
    "    root_dir = '../..' # dir of the source code\n",
    "\n",
    "args = config()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Using backend: pytorch\n"
     ]
    }
   ],
   "source": [
    "import sys\n",
    "sys.path.append(args.root_dir)\n",
    "from train import *"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "start testing on Cora dataset\n",
      "  NumNodes: 2708\n",
      "  NumEdges: 10556\n",
      "  NumFeats: 1433\n",
      "  NumClasses: 7\n",
      "  NumTrainingSamples: 140\n",
      "  NumValidationSamples: 500\n",
      "  NumTestSamples: 1000\n",
      "Done loading data from cached files.\n",
      "time duration = 6.734, best val f1-macro = 0.817, test f1-macro = 0.824\n",
      "time duration = 6.598, best val f1-macro = 0.815, test f1-macro = 0.822\n",
      "time duration = 9.161, best val f1-macro = 0.818, test f1-macro = 0.818\n",
      "time duration = 8.502, best val f1-macro = 0.815, test f1-macro = 0.821\n",
      "time duration = 10.702, best val f1-macro = 0.812, test f1-macro = 0.820\n",
      "time duration = 9.442, best val f1-macro = 0.820, test f1-macro = 0.819\n",
      "time duration = 6.741, best val f1-macro = 0.824, test f1-macro = 0.831\n",
      "time duration = 12.110, best val f1-macro = 0.813, test f1-macro = 0.815\n",
      "time duration = 10.211, best val f1-macro = 0.806, test f1-macro = 0.810\n",
      "time duration = 8.069, best val f1-macro = 0.816, test f1-macro = 0.824\n",
      "time duration = 8.065, best val f1-macro = 0.815, test f1-macro = 0.816\n",
      "time duration = 7.338, best val f1-macro = 0.812, test f1-macro = 0.801\n",
      "time duration = 8.254, best val f1-macro = 0.812, test f1-macro = 0.810\n",
      "time duration = 7.765, best val f1-macro = 0.807, test f1-macro = 0.820\n",
      "time duration = 8.844, best val f1-macro = 0.822, test f1-macro = 0.820\n",
      "time duration = 7.261, best val f1-macro = 0.815, test f1-macro = 0.818\n",
      "time duration = 9.360, best val f1-macro = 0.819, test f1-macro = 0.812\n",
      "time duration = 13.218, best val f1-macro = 0.821, test f1-macro = 0.815\n",
      "time duration = 6.950, best val f1-macro = 0.823, test f1-macro = 0.820\n",
      "time duration = 6.896, best val f1-macro = 0.811, test f1-macro = 0.803\n",
      "time duration = 6.951, best val f1-macro = 0.822, test f1-macro = 0.812\n",
      "time duration = 11.312, best val f1-macro = 0.816, test f1-macro = 0.811\n",
      "time duration = 7.026, best val f1-macro = 0.825, test f1-macro = 0.846\n",
      "time duration = 5.289, best val f1-macro = 0.815, test f1-macro = 0.816\n",
      "time duration = 9.326, best val f1-macro = 0.821, test f1-macro = 0.804\n",
      "time duration = 5.583, best val f1-macro = 0.808, test f1-macro = 0.797\n",
      "time duration = 6.521, best val f1-macro = 0.816, test f1-macro = 0.814\n",
      "time duration = 12.790, best val f1-macro = 0.821, test f1-macro = 0.810\n",
      "time duration = 11.569, best val f1-macro = 0.812, test f1-macro = 0.821\n",
      "time duration = 8.751, best val f1-macro = 0.815, test f1-macro = 0.818\n",
      "test f1-macro (mean, std):  0.8162300703132189 0.009109291732970162\n",
      "test f1-macro (mean, std) after filter:  0.816076042462317 0.004812308834977867\n",
      "\n",
      "start testing on Citeseer dataset\n",
      "  NumNodes: 3327\n",
      "  NumEdges: 9228\n",
      "  NumFeats: 3703\n",
      "  NumClasses: 6\n",
      "  NumTrainingSamples: 120\n",
      "  NumValidationSamples: 500\n",
      "  NumTestSamples: 1000\n",
      "Done loading data from cached files.\n",
      "time duration = 8.403, best val f1-macro = 0.683, test f1-macro = 0.666\n",
      "time duration = 8.362, best val f1-macro = 0.680, test f1-macro = 0.663\n",
      "time duration = 7.035, best val f1-macro = 0.692, test f1-macro = 0.681\n",
      "time duration = 10.682, best val f1-macro = 0.678, test f1-macro = 0.681\n",
      "time duration = 13.422, best val f1-macro = 0.694, test f1-macro = 0.670\n",
      "time duration = 7.157, best val f1-macro = 0.702, test f1-macro = 0.699\n",
      "time duration = 15.403, best val f1-macro = 0.693, test f1-macro = 0.664\n",
      "time duration = 8.151, best val f1-macro = 0.700, test f1-macro = 0.675\n",
      "time duration = 8.660, best val f1-macro = 0.684, test f1-macro = 0.676\n",
      "time duration = 16.522, best val f1-macro = 0.694, test f1-macro = 0.661\n",
      "time duration = 6.459, best val f1-macro = 0.686, test f1-macro = 0.654\n",
      "time duration = 8.591, best val f1-macro = 0.685, test f1-macro = 0.659\n",
      "time duration = 6.936, best val f1-macro = 0.693, test f1-macro = 0.661\n",
      "time duration = 8.664, best val f1-macro = 0.687, test f1-macro = 0.670\n",
      "time duration = 5.772, best val f1-macro = 0.693, test f1-macro = 0.681\n",
      "time duration = 6.970, best val f1-macro = 0.687, test f1-macro = 0.657\n",
      "time duration = 9.344, best val f1-macro = 0.700, test f1-macro = 0.666\n",
      "time duration = 10.864, best val f1-macro = 0.675, test f1-macro = 0.675\n",
      "time duration = 7.623, best val f1-macro = 0.685, test f1-macro = 0.657\n",
      "time duration = 5.907, best val f1-macro = 0.681, test f1-macro = 0.662\n",
      "time duration = 10.272, best val f1-macro = 0.684, test f1-macro = 0.672\n",
      "time duration = 7.124, best val f1-macro = 0.683, test f1-macro = 0.677\n",
      "time duration = 7.019, best val f1-macro = 0.694, test f1-macro = 0.667\n",
      "time duration = 12.055, best val f1-macro = 0.689, test f1-macro = 0.672\n",
      "time duration = 8.657, best val f1-macro = 0.704, test f1-macro = 0.670\n",
      "time duration = 8.650, best val f1-macro = 0.687, test f1-macro = 0.683\n",
      "time duration = 8.102, best val f1-macro = 0.704, test f1-macro = 0.672\n",
      "time duration = 7.531, best val f1-macro = 0.698, test f1-macro = 0.682\n",
      "time duration = 5.851, best val f1-macro = 0.677, test f1-macro = 0.647\n",
      "time duration = 10.114, best val f1-macro = 0.687, test f1-macro = 0.658\n",
      "test f1-macro (mean, std):  0.6693081065342633 0.010596276663140442\n",
      "test f1-macro (mean, std) after filter:  0.669063770308084 0.0072389806497085\n",
      "\n",
      "start testing on Pubmed dataset\n",
      "  NumNodes: 19717\n",
      "  NumEdges: 88651\n",
      "  NumFeats: 500\n",
      "  NumClasses: 3\n",
      "  NumTrainingSamples: 60\n",
      "  NumValidationSamples: 500\n",
      "  NumTestSamples: 1000\n",
      "Done loading data from cached files.\n",
      "time duration = 19.553, best val f1-macro = 0.812, test f1-macro = 0.778\n",
      "time duration = 35.553, best val f1-macro = 0.818, test f1-macro = 0.775\n",
      "time duration = 22.762, best val f1-macro = 0.809, test f1-macro = 0.768\n",
      "time duration = 24.031, best val f1-macro = 0.813, test f1-macro = 0.768\n",
      "time duration = 66.240, best val f1-macro = 0.816, test f1-macro = 0.772\n",
      "time duration = 27.312, best val f1-macro = 0.815, test f1-macro = 0.769\n",
      "time duration = 23.713, best val f1-macro = 0.800, test f1-macro = 0.774\n",
      "time duration = 39.069, best val f1-macro = 0.809, test f1-macro = 0.783\n",
      "time duration = 35.574, best val f1-macro = 0.806, test f1-macro = 0.772\n",
      "time duration = 19.215, best val f1-macro = 0.803, test f1-macro = 0.770\n",
      "time duration = 35.737, best val f1-macro = 0.812, test f1-macro = 0.759\n",
      "time duration = 18.168, best val f1-macro = 0.799, test f1-macro = 0.767\n",
      "time duration = 22.280, best val f1-macro = 0.803, test f1-macro = 0.773\n",
      "time duration = 42.760, best val f1-macro = 0.811, test f1-macro = 0.766\n",
      "time duration = 23.300, best val f1-macro = 0.801, test f1-macro = 0.768\n",
      "time duration = 18.036, best val f1-macro = 0.806, test f1-macro = 0.767\n",
      "time duration = 41.442, best val f1-macro = 0.815, test f1-macro = 0.779\n",
      "time duration = 30.497, best val f1-macro = 0.814, test f1-macro = 0.768\n",
      "time duration = 29.704, best val f1-macro = 0.811, test f1-macro = 0.777\n",
      "time duration = 27.888, best val f1-macro = 0.805, test f1-macro = 0.775\n",
      "time duration = 26.295, best val f1-macro = 0.801, test f1-macro = 0.757\n",
      "time duration = 50.847, best val f1-macro = 0.806, test f1-macro = 0.768\n",
      "time duration = 22.631, best val f1-macro = 0.811, test f1-macro = 0.776\n",
      "time duration = 38.273, best val f1-macro = 0.814, test f1-macro = 0.769\n",
      "time duration = 39.298, best val f1-macro = 0.810, test f1-macro = 0.769\n",
      "time duration = 18.140, best val f1-macro = 0.804, test f1-macro = 0.773\n",
      "time duration = 23.868, best val f1-macro = 0.806, test f1-macro = 0.766\n",
      "time duration = 24.228, best val f1-macro = 0.809, test f1-macro = 0.775\n",
      "time duration = 33.751, best val f1-macro = 0.816, test f1-macro = 0.774\n",
      "time duration = 57.921, best val f1-macro = 0.809, test f1-macro = 0.756\n",
      "test f1-macro (mean, std):  0.7703408260069854 0.006018003142860337\n",
      "test f1-macro (mean, std) after filter:  0.7707454801555146 0.0033543711241887384\n",
      "\n",
      "start testing on Coauthor-CS dataset with random split: 0\n",
      "time duration = 32.715, best val f1-macro = 0.868, test f1-macro = 0.878\n",
      "time duration = 31.715, best val f1-macro = 0.860, test f1-macro = 0.874\n",
      "time duration = 62.145, best val f1-macro = 0.880, test f1-macro = 0.875\n",
      "time duration = 41.333, best val f1-macro = 0.881, test f1-macro = 0.882\n",
      "time duration = 40.887, best val f1-macro = 0.881, test f1-macro = 0.877\n",
      "time duration = 47.901, best val f1-macro = 0.874, test f1-macro = 0.873\n",
      "time duration = 34.102, best val f1-macro = 0.875, test f1-macro = 0.881\n",
      "time duration = 44.741, best val f1-macro = 0.885, test f1-macro = 0.869\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "time duration = 37.342, best val f1-macro = 0.881, test f1-macro = 0.877\n",
      "time duration = 31.085, best val f1-macro = 0.853, test f1-macro = 0.867\n",
      "time duration = 56.626, best val f1-macro = 0.884, test f1-macro = 0.862\n",
      "time duration = 32.491, best val f1-macro = 0.866, test f1-macro = 0.882\n",
      "time duration = 31.560, best val f1-macro = 0.856, test f1-macro = 0.864\n",
      "time duration = 45.026, best val f1-macro = 0.885, test f1-macro = 0.882\n",
      "time duration = 37.577, best val f1-macro = 0.877, test f1-macro = 0.876\n",
      "time duration = 31.362, best val f1-macro = 0.855, test f1-macro = 0.875\n",
      "time duration = 31.877, best val f1-macro = 0.864, test f1-macro = 0.878\n",
      "time duration = 33.111, best val f1-macro = 0.889, test f1-macro = 0.879\n",
      "time duration = 52.249, best val f1-macro = 0.886, test f1-macro = 0.880\n",
      "time duration = 33.667, best val f1-macro = 0.875, test f1-macro = 0.888\n",
      "time duration = 39.152, best val f1-macro = 0.880, test f1-macro = 0.880\n",
      "time duration = 41.046, best val f1-macro = 0.869, test f1-macro = 0.887\n",
      "time duration = 32.829, best val f1-macro = 0.880, test f1-macro = 0.879\n",
      "time duration = 46.150, best val f1-macro = 0.873, test f1-macro = 0.879\n",
      "time duration = 31.298, best val f1-macro = 0.876, test f1-macro = 0.877\n",
      "time duration = 35.223, best val f1-macro = 0.878, test f1-macro = 0.884\n",
      "time duration = 43.548, best val f1-macro = 0.883, test f1-macro = 0.883\n",
      "time duration = 33.226, best val f1-macro = 0.879, test f1-macro = 0.887\n",
      "time duration = 43.868, best val f1-macro = 0.885, test f1-macro = 0.882\n",
      "time duration = 63.514, best val f1-macro = 0.878, test f1-macro = 0.876\n",
      "test f1-macro (mean, std):  0.8776770595581757 0.006174371126504478\n",
      "test f1-macro (mean, std) after filter:  0.8781706157916993 0.0035473071652848674\n",
      "\n",
      "start testing on Coauthor-CS dataset with random split: 1\n",
      "time duration = 32.767, best val f1-macro = 0.892, test f1-macro = 0.878\n",
      "time duration = 54.761, best val f1-macro = 0.922, test f1-macro = 0.867\n",
      "time duration = 31.466, best val f1-macro = 0.907, test f1-macro = 0.868\n",
      "time duration = 43.012, best val f1-macro = 0.909, test f1-macro = 0.878\n",
      "time duration = 33.554, best val f1-macro = 0.912, test f1-macro = 0.877\n",
      "time duration = 31.231, best val f1-macro = 0.882, test f1-macro = 0.857\n",
      "time duration = 31.379, best val f1-macro = 0.903, test f1-macro = 0.876\n",
      "time duration = 41.723, best val f1-macro = 0.918, test f1-macro = 0.879\n",
      "time duration = 67.235, best val f1-macro = 0.920, test f1-macro = 0.874\n",
      "time duration = 40.007, best val f1-macro = 0.912, test f1-macro = 0.883\n",
      "time duration = 34.124, best val f1-macro = 0.912, test f1-macro = 0.882\n",
      "time duration = 34.503, best val f1-macro = 0.908, test f1-macro = 0.883\n",
      "time duration = 42.574, best val f1-macro = 0.916, test f1-macro = 0.880\n",
      "time duration = 32.710, best val f1-macro = 0.914, test f1-macro = 0.879\n",
      "time duration = 31.569, best val f1-macro = 0.898, test f1-macro = 0.863\n",
      "time duration = 33.941, best val f1-macro = 0.914, test f1-macro = 0.883\n",
      "time duration = 32.818, best val f1-macro = 0.912, test f1-macro = 0.874\n",
      "time duration = 32.869, best val f1-macro = 0.912, test f1-macro = 0.879\n",
      "time duration = 58.788, best val f1-macro = 0.913, test f1-macro = 0.873\n",
      "time duration = 32.377, best val f1-macro = 0.909, test f1-macro = 0.875\n",
      "time duration = 33.352, best val f1-macro = 0.916, test f1-macro = 0.875\n",
      "time duration = 34.524, best val f1-macro = 0.914, test f1-macro = 0.882\n",
      "time duration = 32.766, best val f1-macro = 0.918, test f1-macro = 0.885\n",
      "time duration = 41.584, best val f1-macro = 0.916, test f1-macro = 0.880\n",
      "time duration = 32.957, best val f1-macro = 0.907, test f1-macro = 0.871\n",
      "time duration = 41.412, best val f1-macro = 0.918, test f1-macro = 0.878\n",
      "time duration = 37.102, best val f1-macro = 0.907, test f1-macro = 0.882\n",
      "time duration = 33.471, best val f1-macro = 0.911, test f1-macro = 0.883\n",
      "time duration = 31.612, best val f1-macro = 0.907, test f1-macro = 0.878\n",
      "time duration = 71.592, best val f1-macro = 0.920, test f1-macro = 0.880\n",
      "test f1-macro (mean, std):  0.8766485138376622 0.006158694777392887\n",
      "test f1-macro (mean, std) after filter:  0.8775443823999379 0.003622039307114685\n",
      "\n",
      "start testing on Coauthor-CS dataset with random split: 2\n",
      "time duration = 31.453, best val f1-macro = 0.858, test f1-macro = 0.864\n",
      "time duration = 32.261, best val f1-macro = 0.869, test f1-macro = 0.866\n",
      "time duration = 49.805, best val f1-macro = 0.905, test f1-macro = 0.880\n",
      "time duration = 35.940, best val f1-macro = 0.881, test f1-macro = 0.863\n",
      "time duration = 36.894, best val f1-macro = 0.894, test f1-macro = 0.874\n",
      "time duration = 34.576, best val f1-macro = 0.888, test f1-macro = 0.873\n",
      "time duration = 31.567, best val f1-macro = 0.864, test f1-macro = 0.855\n",
      "time duration = 31.998, best val f1-macro = 0.874, test f1-macro = 0.871\n",
      "time duration = 55.190, best val f1-macro = 0.902, test f1-macro = 0.864\n",
      "time duration = 36.889, best val f1-macro = 0.908, test f1-macro = 0.875\n",
      "time duration = 42.074, best val f1-macro = 0.890, test f1-macro = 0.876\n",
      "time duration = 31.118, best val f1-macro = 0.853, test f1-macro = 0.844\n",
      "time duration = 41.898, best val f1-macro = 0.894, test f1-macro = 0.857\n",
      "time duration = 31.056, best val f1-macro = 0.874, test f1-macro = 0.865\n",
      "time duration = 32.598, best val f1-macro = 0.882, test f1-macro = 0.871\n",
      "time duration = 31.329, best val f1-macro = 0.847, test f1-macro = 0.862\n",
      "time duration = 39.205, best val f1-macro = 0.906, test f1-macro = 0.869\n",
      "time duration = 83.610, best val f1-macro = 0.896, test f1-macro = 0.864\n",
      "time duration = 43.960, best val f1-macro = 0.891, test f1-macro = 0.872\n",
      "time duration = 44.072, best val f1-macro = 0.899, test f1-macro = 0.872\n",
      "time duration = 34.670, best val f1-macro = 0.897, test f1-macro = 0.864\n",
      "time duration = 48.907, best val f1-macro = 0.895, test f1-macro = 0.869\n",
      "time duration = 37.970, best val f1-macro = 0.899, test f1-macro = 0.871\n",
      "time duration = 32.360, best val f1-macro = 0.876, test f1-macro = 0.876\n",
      "time duration = 48.901, best val f1-macro = 0.894, test f1-macro = 0.866\n",
      "time duration = 36.770, best val f1-macro = 0.903, test f1-macro = 0.877\n",
      "time duration = 42.875, best val f1-macro = 0.902, test f1-macro = 0.876\n",
      "time duration = 39.391, best val f1-macro = 0.904, test f1-macro = 0.879\n",
      "time duration = 45.611, best val f1-macro = 0.907, test f1-macro = 0.870\n",
      "time duration = 48.800, best val f1-macro = 0.899, test f1-macro = 0.869\n",
      "test f1-macro (mean, std):  0.8685233479125051 0.007610545234634457\n",
      "test f1-macro (mean, std) after filter:  0.8693305167623512 0.004456600508857055\n"
     ]
    }
   ],
   "source": [
    "accs = []\n",
    "datasets = ['Cora', 'Citeseer', 'Pubmed', 'Coauthor-CS']\n",
    "for dataset in datasets:\n",
    "    args.data = dataset\n",
    "    if dataset == 'Cora':\n",
    "        args.dropout = 0.8\n",
    "        args.dropout2 = 0.8\n",
    "        print('\\nstart testing on ' + dataset + ' dataset')\n",
    "        accs.append(main(args))\n",
    "    elif dataset == 'Citeseer':\n",
    "        args.dropout = 0.8\n",
    "        args.dropout2 = 0.8\n",
    "        print('\\nstart testing on ' + dataset + ' dataset')\n",
    "        accs.append(main(args))\n",
    "    elif dataset == 'Pubmed':\n",
    "        args.dropout = 0.8\n",
    "        args.dropout2 = 0.2\n",
    "        print('\\nstart testing on ' + dataset + ' dataset')\n",
    "        accs.append(main(args))\n",
    "    elif dataset == 'Coauthor-CS':\n",
    "        args.dropout = 0.8\n",
    "        args.dropout2 = 0.2\n",
    "        for i in range(3):\n",
    "            print('\\nstart testing on ' + dataset + ' dataset with random split: ' + str(i))\n",
    "            args.test_id = i\n",
    "            accs.append(main(args))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "accs = np.array(accs)\n",
    "np.savetxt('log_f1_macro/f1-macro_GAT_hop2.txt',accs)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
