{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "class config:\n",
    "    data = 'Cora' #choices=[\"Cora\", \"Citeseer\", \"Pubmed\", \"Coauthor-CS\"]\n",
    "    model = 'GTAN' #choices=[\"GCN\", \"GAT\", \"APPNP\", \"DAGNN\", \"TreeLSTM\", \"GTCN\", \"GTAN\", \"GTCN2\"]\n",
    "    n_in = 0\n",
    "    n_hid = 64\n",
    "    n_out = 0\n",
    "    num_heads = 1\n",
    "    num_out_heads = 1\n",
    "    device = 'cpu'\n",
    "    dropout = 0.6\n",
    "    dropout2 = 0\n",
    "    learning_rate = 0.01\n",
    "    weight_decay = 5e-4\n",
    "    patience = 300\n",
    "    num_iter = 1000\n",
    "    num_test = 30\n",
    "    hop = 10\n",
    "    alpha = 0.1 # used by APPNP only\n",
    "    random_label_split = False\n",
    "    num_train = 20 # for random label split only\n",
    "    num_val = 30 # for random label split only\n",
    "    data_load = True # load the saved label split to rerun the test (for reproduce purpose)\n",
    "    test_id = 1 # number of the test, only used to record the ith number of the random label split (for reproduce purpose)\n",
    "    filter_pct = 0.1 # remove the top and bottom filer_pct points before obtaining statistics of test accuracy\n",
    "    log = False # whether to show the training log or not\n",
    "    eval_metric = 'f1-macro' # evaluation metrics, choices=[\"acc\", \"f1-macro\", \"f1-micro\"]\n",
    "    root_dir = '../..' # dir of the source code\n",
    "\n",
    "args = config()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Using backend: pytorch\n"
     ]
    }
   ],
   "source": [
    "import sys\n",
    "sys.path.append(args.root_dir)\n",
    "from train import *"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "start testing on Cora dataset\n",
      "  NumNodes: 2708\n",
      "  NumEdges: 10556\n",
      "  NumFeats: 1433\n",
      "  NumClasses: 7\n",
      "  NumTrainingSamples: 140\n",
      "  NumValidationSamples: 500\n",
      "  NumTestSamples: 1000\n",
      "Done loading data from cached files.\n",
      "time duration = 22.255, best val f1-macro = 0.813, test f1-macro = 0.813\n",
      "time duration = 34.225, best val f1-macro = 0.816, test f1-macro = 0.832\n",
      "time duration = 31.065, best val f1-macro = 0.813, test f1-macro = 0.817\n",
      "time duration = 19.181, best val f1-macro = 0.803, test f1-macro = 0.796\n",
      "time duration = 44.717, best val f1-macro = 0.808, test f1-macro = 0.819\n",
      "time duration = 19.634, best val f1-macro = 0.813, test f1-macro = 0.798\n",
      "time duration = 54.917, best val f1-macro = 0.802, test f1-macro = 0.826\n",
      "time duration = 19.795, best val f1-macro = 0.812, test f1-macro = 0.809\n",
      "time duration = 39.733, best val f1-macro = 0.822, test f1-macro = 0.828\n",
      "time duration = 38.215, best val f1-macro = 0.813, test f1-macro = 0.826\n",
      "time duration = 33.235, best val f1-macro = 0.821, test f1-macro = 0.818\n",
      "time duration = 19.594, best val f1-macro = 0.817, test f1-macro = 0.812\n",
      "time duration = 19.521, best val f1-macro = 0.807, test f1-macro = 0.805\n",
      "time duration = 20.225, best val f1-macro = 0.810, test f1-macro = 0.810\n",
      "time duration = 19.979, best val f1-macro = 0.803, test f1-macro = 0.801\n",
      "time duration = 28.374, best val f1-macro = 0.823, test f1-macro = 0.815\n",
      "time duration = 52.717, best val f1-macro = 0.808, test f1-macro = 0.837\n",
      "time duration = 36.484, best val f1-macro = 0.809, test f1-macro = 0.820\n",
      "time duration = 19.297, best val f1-macro = 0.814, test f1-macro = 0.807\n",
      "time duration = 20.054, best val f1-macro = 0.820, test f1-macro = 0.812\n",
      "time duration = 20.089, best val f1-macro = 0.814, test f1-macro = 0.817\n",
      "time duration = 34.778, best val f1-macro = 0.817, test f1-macro = 0.822\n",
      "time duration = 27.277, best val f1-macro = 0.823, test f1-macro = 0.814\n",
      "time duration = 32.579, best val f1-macro = 0.813, test f1-macro = 0.827\n",
      "time duration = 39.655, best val f1-macro = 0.810, test f1-macro = 0.826\n",
      "time duration = 37.536, best val f1-macro = 0.807, test f1-macro = 0.817\n",
      "time duration = 33.594, best val f1-macro = 0.807, test f1-macro = 0.812\n",
      "time duration = 33.212, best val f1-macro = 0.819, test f1-macro = 0.827\n",
      "time duration = 35.969, best val f1-macro = 0.806, test f1-macro = 0.813\n",
      "time duration = 18.998, best val f1-macro = 0.809, test f1-macro = 0.821\n",
      "test f1-macro (mean, std):  0.8165973474938575 0.009763500198177993\n",
      "test f1-macro (mean, std) after filter:  0.8169169457962546 0.006497885243250747\n",
      "\n",
      "start testing on Citeseer dataset\n",
      "  NumNodes: 3327\n",
      "  NumEdges: 9228\n",
      "  NumFeats: 3703\n",
      "  NumClasses: 6\n",
      "  NumTrainingSamples: 120\n",
      "  NumValidationSamples: 500\n",
      "  NumTestSamples: 1000\n",
      "Done loading data from cached files.\n",
      "time duration = 20.882, best val f1-macro = 0.699, test f1-macro = 0.684\n",
      "time duration = 20.934, best val f1-macro = 0.696, test f1-macro = 0.679\n",
      "time duration = 35.103, best val f1-macro = 0.700, test f1-macro = 0.687\n",
      "time duration = 20.441, best val f1-macro = 0.701, test f1-macro = 0.677\n",
      "time duration = 20.149, best val f1-macro = 0.699, test f1-macro = 0.685\n",
      "time duration = 21.296, best val f1-macro = 0.702, test f1-macro = 0.680\n",
      "time duration = 20.688, best val f1-macro = 0.699, test f1-macro = 0.673\n",
      "time duration = 20.882, best val f1-macro = 0.716, test f1-macro = 0.684\n",
      "time duration = 20.031, best val f1-macro = 0.703, test f1-macro = 0.684\n",
      "time duration = 20.162, best val f1-macro = 0.704, test f1-macro = 0.676\n",
      "time duration = 26.104, best val f1-macro = 0.699, test f1-macro = 0.677\n",
      "time duration = 23.736, best val f1-macro = 0.702, test f1-macro = 0.680\n",
      "time duration = 20.784, best val f1-macro = 0.703, test f1-macro = 0.670\n",
      "time duration = 26.149, best val f1-macro = 0.690, test f1-macro = 0.689\n",
      "time duration = 20.795, best val f1-macro = 0.702, test f1-macro = 0.680\n",
      "time duration = 35.307, best val f1-macro = 0.700, test f1-macro = 0.686\n",
      "time duration = 20.409, best val f1-macro = 0.706, test f1-macro = 0.674\n",
      "time duration = 19.124, best val f1-macro = 0.718, test f1-macro = 0.672\n",
      "time duration = 33.638, best val f1-macro = 0.694, test f1-macro = 0.678\n",
      "time duration = 20.152, best val f1-macro = 0.704, test f1-macro = 0.679\n",
      "time duration = 20.535, best val f1-macro = 0.705, test f1-macro = 0.682\n",
      "time duration = 21.952, best val f1-macro = 0.711, test f1-macro = 0.683\n",
      "time duration = 21.103, best val f1-macro = 0.702, test f1-macro = 0.681\n",
      "time duration = 25.420, best val f1-macro = 0.705, test f1-macro = 0.692\n",
      "time duration = 19.867, best val f1-macro = 0.703, test f1-macro = 0.666\n",
      "time duration = 20.744, best val f1-macro = 0.715, test f1-macro = 0.684\n",
      "time duration = 29.590, best val f1-macro = 0.698, test f1-macro = 0.684\n",
      "time duration = 28.575, best val f1-macro = 0.699, test f1-macro = 0.683\n",
      "time duration = 20.975, best val f1-macro = 0.703, test f1-macro = 0.683\n",
      "time duration = 24.651, best val f1-macro = 0.704, test f1-macro = 0.677\n",
      "test f1-macro (mean, std):  0.6802492710627022 0.005625905868138413\n",
      "test f1-macro (mean, std) after filter:  0.6804852088551107 0.003562238111504118\n",
      "\n",
      "start testing on Pubmed dataset\n",
      "  NumNodes: 19717\n",
      "  NumEdges: 88651\n",
      "  NumFeats: 500\n",
      "  NumClasses: 3\n",
      "  NumTrainingSamples: 60\n",
      "  NumValidationSamples: 500\n",
      "  NumTestSamples: 1000\n",
      "Done loading data from cached files.\n",
      "time duration = 66.009, best val f1-macro = 0.834, test f1-macro = 0.789\n",
      "time duration = 71.421, best val f1-macro = 0.832, test f1-macro = 0.791\n",
      "time duration = 76.139, best val f1-macro = 0.830, test f1-macro = 0.783\n",
      "time duration = 39.456, best val f1-macro = 0.828, test f1-macro = 0.787\n",
      "time duration = 70.873, best val f1-macro = 0.829, test f1-macro = 0.786\n",
      "time duration = 77.499, best val f1-macro = 0.829, test f1-macro = 0.787\n",
      "time duration = 49.188, best val f1-macro = 0.825, test f1-macro = 0.786\n",
      "time duration = 48.114, best val f1-macro = 0.828, test f1-macro = 0.788\n",
      "time duration = 39.422, best val f1-macro = 0.825, test f1-macro = 0.788\n",
      "time duration = 40.469, best val f1-macro = 0.822, test f1-macro = 0.783\n",
      "time duration = 39.152, best val f1-macro = 0.824, test f1-macro = 0.784\n",
      "time duration = 38.838, best val f1-macro = 0.828, test f1-macro = 0.787\n",
      "time duration = 39.731, best val f1-macro = 0.826, test f1-macro = 0.781\n",
      "time duration = 64.531, best val f1-macro = 0.825, test f1-macro = 0.776\n",
      "time duration = 40.124, best val f1-macro = 0.823, test f1-macro = 0.787\n",
      "time duration = 69.682, best val f1-macro = 0.830, test f1-macro = 0.783\n",
      "time duration = 61.374, best val f1-macro = 0.828, test f1-macro = 0.781\n",
      "time duration = 60.724, best val f1-macro = 0.833, test f1-macro = 0.788\n",
      "time duration = 41.771, best val f1-macro = 0.832, test f1-macro = 0.781\n",
      "time duration = 50.794, best val f1-macro = 0.830, test f1-macro = 0.789\n",
      "time duration = 57.471, best val f1-macro = 0.830, test f1-macro = 0.792\n",
      "time duration = 44.934, best val f1-macro = 0.836, test f1-macro = 0.790\n",
      "time duration = 66.113, best val f1-macro = 0.827, test f1-macro = 0.782\n",
      "time duration = 49.560, best val f1-macro = 0.825, test f1-macro = 0.783\n",
      "time duration = 56.984, best val f1-macro = 0.831, test f1-macro = 0.788\n",
      "time duration = 96.516, best val f1-macro = 0.822, test f1-macro = 0.790\n",
      "time duration = 58.136, best val f1-macro = 0.830, test f1-macro = 0.786\n",
      "time duration = 39.998, best val f1-macro = 0.829, test f1-macro = 0.786\n",
      "time duration = 47.853, best val f1-macro = 0.825, test f1-macro = 0.790\n",
      "time duration = 39.678, best val f1-macro = 0.827, test f1-macro = 0.791\n",
      "test f1-macro (mean, std):  0.786163159580862 0.003752315139804137\n",
      "test f1-macro (mean, std) after filter:  0.7863422577703193 0.002684882419457415\n",
      "\n",
      "start testing on Coauthor-CS dataset with random split: 0\n",
      "time duration = 53.843, best val f1-macro = 0.914, test f1-macro = 0.904\n",
      "time duration = 52.937, best val f1-macro = 0.917, test f1-macro = 0.901\n",
      "time duration = 52.376, best val f1-macro = 0.910, test f1-macro = 0.901\n",
      "time duration = 57.624, best val f1-macro = 0.914, test f1-macro = 0.903\n",
      "time duration = 52.846, best val f1-macro = 0.909, test f1-macro = 0.905\n",
      "time duration = 65.906, best val f1-macro = 0.914, test f1-macro = 0.901\n",
      "time duration = 52.576, best val f1-macro = 0.904, test f1-macro = 0.905\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "time duration = 53.772, best val f1-macro = 0.908, test f1-macro = 0.898\n",
      "time duration = 105.011, best val f1-macro = 0.914, test f1-macro = 0.907\n",
      "time duration = 59.700, best val f1-macro = 0.903, test f1-macro = 0.897\n",
      "time duration = 55.101, best val f1-macro = 0.922, test f1-macro = 0.905\n",
      "time duration = 53.630, best val f1-macro = 0.910, test f1-macro = 0.895\n",
      "time duration = 53.440, best val f1-macro = 0.920, test f1-macro = 0.906\n",
      "time duration = 55.870, best val f1-macro = 0.918, test f1-macro = 0.906\n",
      "time duration = 89.815, best val f1-macro = 0.916, test f1-macro = 0.908\n",
      "time duration = 51.176, best val f1-macro = 0.874, test f1-macro = 0.843\n",
      "time duration = 56.950, best val f1-macro = 0.914, test f1-macro = 0.906\n",
      "time duration = 93.922, best val f1-macro = 0.916, test f1-macro = 0.906\n",
      "time duration = 51.878, best val f1-macro = 0.907, test f1-macro = 0.893\n",
      "time duration = 53.808, best val f1-macro = 0.910, test f1-macro = 0.899\n",
      "time duration = 59.394, best val f1-macro = 0.911, test f1-macro = 0.887\n",
      "time duration = 82.258, best val f1-macro = 0.903, test f1-macro = 0.903\n",
      "time duration = 62.918, best val f1-macro = 0.915, test f1-macro = 0.906\n",
      "time duration = 50.705, best val f1-macro = 0.835, test f1-macro = 0.850\n",
      "time duration = 167.567, best val f1-macro = 0.923, test f1-macro = 0.902\n",
      "time duration = 61.471, best val f1-macro = 0.914, test f1-macro = 0.905\n",
      "time duration = 62.620, best val f1-macro = 0.914, test f1-macro = 0.911\n",
      "time duration = 79.093, best val f1-macro = 0.904, test f1-macro = 0.900\n",
      "time duration = 53.402, best val f1-macro = 0.922, test f1-macro = 0.903\n",
      "time duration = 52.554, best val f1-macro = 0.905, test f1-macro = 0.900\n",
      "test f1-macro (mean, std):  0.8984999075392508 0.014795020580274522\n",
      "test f1-macro (mean, std) after filter:  0.9021011757623159 0.0035852265975477196\n",
      "\n",
      "start testing on Coauthor-CS dataset with random split: 1\n",
      "time duration = 52.694, best val f1-macro = 0.931, test f1-macro = 0.905\n",
      "time duration = 104.171, best val f1-macro = 0.936, test f1-macro = 0.905\n",
      "time duration = 109.631, best val f1-macro = 0.947, test f1-macro = 0.910\n",
      "time duration = 67.906, best val f1-macro = 0.941, test f1-macro = 0.907\n",
      "time duration = 110.560, best val f1-macro = 0.941, test f1-macro = 0.902\n",
      "time duration = 68.800, best val f1-macro = 0.938, test f1-macro = 0.909\n",
      "time duration = 56.439, best val f1-macro = 0.940, test f1-macro = 0.905\n",
      "time duration = 52.933, best val f1-macro = 0.943, test f1-macro = 0.906\n",
      "time duration = 56.932, best val f1-macro = 0.936, test f1-macro = 0.898\n",
      "time duration = 66.395, best val f1-macro = 0.943, test f1-macro = 0.911\n",
      "time duration = 53.104, best val f1-macro = 0.934, test f1-macro = 0.900\n",
      "time duration = 53.860, best val f1-macro = 0.932, test f1-macro = 0.902\n",
      "time duration = 52.715, best val f1-macro = 0.931, test f1-macro = 0.904\n",
      "time duration = 65.126, best val f1-macro = 0.936, test f1-macro = 0.907\n",
      "time duration = 52.563, best val f1-macro = 0.934, test f1-macro = 0.906\n",
      "time duration = 153.318, best val f1-macro = 0.949, test f1-macro = 0.913\n",
      "time duration = 56.603, best val f1-macro = 0.929, test f1-macro = 0.898\n",
      "time duration = 104.191, best val f1-macro = 0.945, test f1-macro = 0.906\n",
      "time duration = 52.363, best val f1-macro = 0.933, test f1-macro = 0.906\n",
      "time duration = 75.037, best val f1-macro = 0.945, test f1-macro = 0.908\n",
      "time duration = 58.218, best val f1-macro = 0.932, test f1-macro = 0.905\n",
      "time duration = 53.070, best val f1-macro = 0.929, test f1-macro = 0.900\n",
      "time duration = 77.490, best val f1-macro = 0.942, test f1-macro = 0.910\n",
      "time duration = 57.643, best val f1-macro = 0.936, test f1-macro = 0.911\n",
      "time duration = 122.325, best val f1-macro = 0.951, test f1-macro = 0.908\n",
      "time duration = 109.524, best val f1-macro = 0.943, test f1-macro = 0.907\n",
      "time duration = 56.635, best val f1-macro = 0.938, test f1-macro = 0.900\n",
      "time duration = 52.855, best val f1-macro = 0.934, test f1-macro = 0.904\n",
      "time duration = 52.412, best val f1-macro = 0.942, test f1-macro = 0.910\n",
      "time duration = 76.569, best val f1-macro = 0.931, test f1-macro = 0.902\n",
      "test f1-macro (mean, std):  0.9055582747018237 0.003955236993852039\n",
      "test f1-macro (mean, std) after filter:  0.9056995956174688 0.0028930822829977\n",
      "\n",
      "start testing on Coauthor-CS dataset with random split: 2\n",
      "time duration = 52.156, best val f1-macro = 0.905, test f1-macro = 0.895\n",
      "time duration = 68.889, best val f1-macro = 0.917, test f1-macro = 0.899\n",
      "time duration = 51.598, best val f1-macro = 0.919, test f1-macro = 0.894\n",
      "time duration = 60.698, best val f1-macro = 0.908, test f1-macro = 0.901\n",
      "time duration = 70.453, best val f1-macro = 0.914, test f1-macro = 0.901\n",
      "time duration = 59.618, best val f1-macro = 0.917, test f1-macro = 0.900\n",
      "time duration = 100.814, best val f1-macro = 0.914, test f1-macro = 0.899\n",
      "time duration = 52.112, best val f1-macro = 0.908, test f1-macro = 0.896\n",
      "time duration = 64.335, best val f1-macro = 0.923, test f1-macro = 0.898\n",
      "time duration = 52.037, best val f1-macro = 0.917, test f1-macro = 0.894\n",
      "time duration = 62.336, best val f1-macro = 0.922, test f1-macro = 0.903\n",
      "time duration = 59.251, best val f1-macro = 0.910, test f1-macro = 0.885\n",
      "time duration = 58.759, best val f1-macro = 0.909, test f1-macro = 0.901\n",
      "time duration = 69.150, best val f1-macro = 0.914, test f1-macro = 0.900\n",
      "time duration = 99.618, best val f1-macro = 0.923, test f1-macro = 0.900\n",
      "time duration = 83.105, best val f1-macro = 0.918, test f1-macro = 0.896\n",
      "time duration = 52.171, best val f1-macro = 0.921, test f1-macro = 0.893\n",
      "time duration = 73.154, best val f1-macro = 0.914, test f1-macro = 0.896\n",
      "time duration = 53.673, best val f1-macro = 0.908, test f1-macro = 0.888\n",
      "time duration = 66.287, best val f1-macro = 0.919, test f1-macro = 0.903\n",
      "time duration = 89.773, best val f1-macro = 0.916, test f1-macro = 0.899\n",
      "time duration = 98.079, best val f1-macro = 0.915, test f1-macro = 0.902\n",
      "time duration = 51.928, best val f1-macro = 0.910, test f1-macro = 0.893\n",
      "time duration = 52.799, best val f1-macro = 0.919, test f1-macro = 0.899\n",
      "time duration = 82.686, best val f1-macro = 0.929, test f1-macro = 0.898\n",
      "time duration = 53.579, best val f1-macro = 0.908, test f1-macro = 0.897\n",
      "time duration = 64.124, best val f1-macro = 0.913, test f1-macro = 0.893\n",
      "time duration = 57.999, best val f1-macro = 0.915, test f1-macro = 0.901\n",
      "time duration = 53.157, best val f1-macro = 0.915, test f1-macro = 0.899\n",
      "time duration = 67.332, best val f1-macro = 0.919, test f1-macro = 0.901\n",
      "test f1-macro (mean, std):  0.8974899142369879 0.004144022219418352\n",
      "test f1-macro (mean, std) after filter:  0.897959174066426 0.0026563919354495864\n"
     ]
    }
   ],
   "source": [
    "accs = []\n",
    "datasets = ['Cora', 'Citeseer', 'Pubmed', 'Coauthor-CS']\n",
    "for dataset in datasets:\n",
    "    args.data = dataset\n",
    "    if dataset == 'Cora':\n",
    "        args.dropout = 0.6\n",
    "        args.dropout2 = 0\n",
    "        args.weight_decay = 5e-4\n",
    "        print('\\nstart testing on ' + dataset + ' dataset')\n",
    "        accs.append(main(args))\n",
    "    elif dataset == 'Citeseer':\n",
    "        args.dropout = 0.6\n",
    "        args.dropout2 = 0\n",
    "        args.weight_decay = 5e-4\n",
    "        print('\\nstart testing on ' + dataset + ' dataset')\n",
    "        accs.append(main(args))\n",
    "    elif dataset == 'Pubmed':\n",
    "        args.dropout = 0.6\n",
    "        args.dropout2 = 0\n",
    "        args.weight_decay = 5e-4\n",
    "        print('\\nstart testing on ' + dataset + ' dataset')\n",
    "        accs.append(main(args))\n",
    "    elif dataset == 'Coauthor-CS':\n",
    "        args.dropout = 0.2\n",
    "        args.dropout2 = 0.2\n",
    "        args.weight_decay = 5e-3\n",
    "        for i in range(3):\n",
    "            print('\\nstart testing on ' + dataset + ' dataset with random split: ' + str(i))\n",
    "            args.test_id = i\n",
    "            accs.append(main(args))\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "accs = np.array(accs)\n",
    "np.savetxt('log_f1_macro/f1-macro_GTAN_hop10-copy1.txt',accs)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
