{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "class config:\n",
    "    data = 'Cora' #choices=[\"Cora\", \"Citeseer\", \"Pubmed\", \"Coauthor-CS\"]\n",
    "    model = 'TreeLSTM' #choices=[\"GCN\", \"GAT\", \"APPNP\", \"DAGNN\", \"TreeLSTM\", \"GTCN\", \"GTAN\", \"GTCN2\"]\n",
    "    n_in = 0\n",
    "    n_hid = 64\n",
    "    n_out = 0\n",
    "    num_heads = 1\n",
    "    num_out_heads = 1\n",
    "    device = 'cpu'\n",
    "    dropout = 0.8\n",
    "    dropout2 = 0.6\n",
    "    learning_rate = 0.01\n",
    "    weight_decay = 5e-4\n",
    "    patience = 200\n",
    "    num_iter = 1000\n",
    "    num_test = 30\n",
    "    hop = 2\n",
    "    alpha = 0.1 # used by APPNP only\n",
    "    random_label_split = False\n",
    "    num_train = 20 # for random label split only\n",
    "    num_val = 30 # for random label split only\n",
    "    data_load = True # load the saved label split to rerun the test (for reproduce purpose)\n",
    "    test_id = 1 # number of the test, only used to record the ith number of the random label split (for reproduce purpose)\n",
    "    filter_pct = 0.1 # remove the top and bottom filer_pct points before obtaining statistics of test accuracy\n",
    "    log = False # whether to show the training log or not\n",
    "    eval_metric = 'f1-macro' # evaluation metrics, choices=[\"acc\", \"f1-macro\", \"f1-micro\"]\n",
    "    root_dir = '../..' # dir of the source code\n",
    "\n",
    "args = config()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Using backend: pytorch\n"
     ]
    }
   ],
   "source": [
    "import sys\n",
    "sys.path.append(args.root_dir)\n",
    "from train import *"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "start testing on Cora dataset\n",
      "  NumNodes: 2708\n",
      "  NumEdges: 10556\n",
      "  NumFeats: 1433\n",
      "  NumClasses: 7\n",
      "  NumTrainingSamples: 140\n",
      "  NumValidationSamples: 500\n",
      "  NumTestSamples: 1000\n",
      "Done loading data from cached files.\n",
      "time duration = 11.288, best val f1-macro = 0.805, test f1-macro = 0.796\n",
      "time duration = 7.264, best val f1-macro = 0.801, test f1-macro = 0.803\n",
      "time duration = 5.905, best val f1-macro = 0.800, test f1-macro = 0.824\n",
      "time duration = 5.147, best val f1-macro = 0.807, test f1-macro = 0.817\n",
      "time duration = 4.989, best val f1-macro = 0.805, test f1-macro = 0.808\n",
      "time duration = 5.085, best val f1-macro = 0.793, test f1-macro = 0.803\n",
      "time duration = 6.951, best val f1-macro = 0.810, test f1-macro = 0.807\n",
      "time duration = 5.172, best val f1-macro = 0.802, test f1-macro = 0.817\n",
      "time duration = 8.973, best val f1-macro = 0.806, test f1-macro = 0.781\n",
      "time duration = 5.579, best val f1-macro = 0.799, test f1-macro = 0.817\n",
      "time duration = 6.751, best val f1-macro = 0.809, test f1-macro = 0.805\n",
      "time duration = 6.490, best val f1-macro = 0.807, test f1-macro = 0.815\n",
      "time duration = 5.759, best val f1-macro = 0.793, test f1-macro = 0.797\n",
      "time duration = 10.265, best val f1-macro = 0.799, test f1-macro = 0.791\n",
      "time duration = 5.591, best val f1-macro = 0.796, test f1-macro = 0.821\n",
      "time duration = 9.206, best val f1-macro = 0.802, test f1-macro = 0.808\n",
      "time duration = 5.865, best val f1-macro = 0.806, test f1-macro = 0.797\n",
      "time duration = 6.264, best val f1-macro = 0.807, test f1-macro = 0.807\n",
      "time duration = 6.725, best val f1-macro = 0.809, test f1-macro = 0.803\n",
      "time duration = 6.393, best val f1-macro = 0.798, test f1-macro = 0.799\n",
      "time duration = 7.136, best val f1-macro = 0.802, test f1-macro = 0.803\n",
      "time duration = 8.406, best val f1-macro = 0.812, test f1-macro = 0.807\n",
      "time duration = 8.403, best val f1-macro = 0.807, test f1-macro = 0.806\n",
      "time duration = 6.867, best val f1-macro = 0.812, test f1-macro = 0.817\n",
      "time duration = 8.497, best val f1-macro = 0.799, test f1-macro = 0.802\n",
      "time duration = 7.245, best val f1-macro = 0.801, test f1-macro = 0.803\n",
      "time duration = 5.677, best val f1-macro = 0.800, test f1-macro = 0.821\n",
      "time duration = 6.790, best val f1-macro = 0.795, test f1-macro = 0.803\n",
      "time duration = 8.155, best val f1-macro = 0.802, test f1-macro = 0.807\n",
      "time duration = 5.206, best val f1-macro = 0.807, test f1-macro = 0.816\n",
      "test f1-macro (mean, std):  0.8066563792681863 0.009365416588674067\n",
      "test f1-macro (mean, std) after filter:  0.806929903201114 0.0061896584535690155\n",
      "\n",
      "start testing on Citeseer dataset\n",
      "  NumNodes: 3327\n",
      "  NumEdges: 9228\n",
      "  NumFeats: 3703\n",
      "  NumClasses: 6\n",
      "  NumTrainingSamples: 120\n",
      "  NumValidationSamples: 500\n",
      "  NumTestSamples: 1000\n",
      "Done loading data from cached files.\n",
      "time duration = 10.284, best val f1-macro = 0.660, test f1-macro = 0.636\n",
      "time duration = 11.175, best val f1-macro = 0.670, test f1-macro = 0.637\n",
      "time duration = 8.777, best val f1-macro = 0.654, test f1-macro = 0.641\n",
      "time duration = 9.642, best val f1-macro = 0.660, test f1-macro = 0.657\n",
      "time duration = 11.137, best val f1-macro = 0.650, test f1-macro = 0.642\n",
      "time duration = 9.260, best val f1-macro = 0.674, test f1-macro = 0.649\n",
      "time duration = 10.064, best val f1-macro = 0.672, test f1-macro = 0.650\n",
      "time duration = 9.178, best val f1-macro = 0.659, test f1-macro = 0.636\n",
      "time duration = 16.621, best val f1-macro = 0.660, test f1-macro = 0.627\n",
      "time duration = 9.372, best val f1-macro = 0.682, test f1-macro = 0.653\n",
      "time duration = 8.892, best val f1-macro = 0.663, test f1-macro = 0.640\n",
      "time duration = 9.752, best val f1-macro = 0.652, test f1-macro = 0.634\n",
      "time duration = 10.537, best val f1-macro = 0.666, test f1-macro = 0.647\n",
      "time duration = 9.307, best val f1-macro = 0.655, test f1-macro = 0.645\n",
      "time duration = 9.674, best val f1-macro = 0.658, test f1-macro = 0.638\n",
      "time duration = 10.174, best val f1-macro = 0.659, test f1-macro = 0.634\n",
      "time duration = 11.702, best val f1-macro = 0.650, test f1-macro = 0.640\n",
      "time duration = 10.195, best val f1-macro = 0.676, test f1-macro = 0.653\n",
      "time duration = 16.597, best val f1-macro = 0.662, test f1-macro = 0.619\n",
      "time duration = 15.882, best val f1-macro = 0.663, test f1-macro = 0.625\n",
      "time duration = 9.361, best val f1-macro = 0.678, test f1-macro = 0.657\n",
      "time duration = 9.061, best val f1-macro = 0.665, test f1-macro = 0.625\n",
      "time duration = 9.425, best val f1-macro = 0.677, test f1-macro = 0.659\n",
      "time duration = 9.544, best val f1-macro = 0.642, test f1-macro = 0.635\n",
      "time duration = 10.245, best val f1-macro = 0.659, test f1-macro = 0.662\n",
      "time duration = 9.471, best val f1-macro = 0.681, test f1-macro = 0.653\n",
      "time duration = 9.470, best val f1-macro = 0.672, test f1-macro = 0.651\n",
      "time duration = 9.013, best val f1-macro = 0.664, test f1-macro = 0.634\n",
      "time duration = 14.773, best val f1-macro = 0.661, test f1-macro = 0.624\n",
      "time duration = 9.790, best val f1-macro = 0.666, test f1-macro = 0.652\n",
      "test f1-macro (mean, std):  0.6419096790651782 0.01133772676172716\n",
      "test f1-macro (mean, std) after filter:  0.6421441749362454 0.008633386132016255\n",
      "\n",
      "start testing on Pubmed dataset\n",
      "  NumNodes: 19717\n",
      "  NumEdges: 88651\n",
      "  NumFeats: 500\n",
      "  NumClasses: 3\n",
      "  NumTrainingSamples: 60\n",
      "  NumValidationSamples: 500\n",
      "  NumTestSamples: 1000\n",
      "Done loading data from cached files.\n",
      "time duration = 13.295, best val f1-macro = 0.790, test f1-macro = 0.750\n",
      "time duration = 13.358, best val f1-macro = 0.787, test f1-macro = 0.760\n",
      "time duration = 13.093, best val f1-macro = 0.795, test f1-macro = 0.757\n",
      "time duration = 14.094, best val f1-macro = 0.791, test f1-macro = 0.770\n",
      "time duration = 12.643, best val f1-macro = 0.796, test f1-macro = 0.762\n",
      "time duration = 12.934, best val f1-macro = 0.792, test f1-macro = 0.756\n",
      "time duration = 16.705, best val f1-macro = 0.791, test f1-macro = 0.755\n",
      "time duration = 19.041, best val f1-macro = 0.793, test f1-macro = 0.762\n",
      "time duration = 24.270, best val f1-macro = 0.798, test f1-macro = 0.771\n",
      "time duration = 13.458, best val f1-macro = 0.799, test f1-macro = 0.762\n",
      "time duration = 20.433, best val f1-macro = 0.799, test f1-macro = 0.771\n",
      "time duration = 18.367, best val f1-macro = 0.791, test f1-macro = 0.772\n",
      "time duration = 12.853, best val f1-macro = 0.795, test f1-macro = 0.756\n",
      "time duration = 20.931, best val f1-macro = 0.792, test f1-macro = 0.763\n",
      "time duration = 17.664, best val f1-macro = 0.793, test f1-macro = 0.765\n",
      "time duration = 13.630, best val f1-macro = 0.785, test f1-macro = 0.749\n",
      "time duration = 21.805, best val f1-macro = 0.793, test f1-macro = 0.760\n",
      "time duration = 20.719, best val f1-macro = 0.795, test f1-macro = 0.767\n",
      "time duration = 20.156, best val f1-macro = 0.790, test f1-macro = 0.760\n",
      "time duration = 12.419, best val f1-macro = 0.791, test f1-macro = 0.755\n",
      "time duration = 13.518, best val f1-macro = 0.793, test f1-macro = 0.752\n",
      "time duration = 12.904, best val f1-macro = 0.798, test f1-macro = 0.765\n",
      "time duration = 21.434, best val f1-macro = 0.793, test f1-macro = 0.762\n",
      "time duration = 19.438, best val f1-macro = 0.798, test f1-macro = 0.761\n",
      "time duration = 14.161, best val f1-macro = 0.787, test f1-macro = 0.772\n",
      "time duration = 13.606, best val f1-macro = 0.794, test f1-macro = 0.751\n",
      "time duration = 18.036, best val f1-macro = 0.798, test f1-macro = 0.773\n",
      "time duration = 14.704, best val f1-macro = 0.803, test f1-macro = 0.773\n",
      "time duration = 18.156, best val f1-macro = 0.791, test f1-macro = 0.762\n",
      "time duration = 12.636, best val f1-macro = 0.797, test f1-macro = 0.751\n",
      "test f1-macro (mean, std):  0.7615076131798174 0.00732193988543801\n",
      "test f1-macro (mean, std) after filter:  0.7615516358928814 0.005820264487355179\n",
      "\n",
      "start testing on Coauthor-CS dataset with random split: 0\n",
      "time duration = 56.970, best val f1-macro = 0.895, test f1-macro = 0.885\n",
      "time duration = 67.783, best val f1-macro = 0.893, test f1-macro = 0.896\n",
      "time duration = 58.618, best val f1-macro = 0.893, test f1-macro = 0.891\n",
      "time duration = 67.314, best val f1-macro = 0.897, test f1-macro = 0.891\n",
      "time duration = 58.054, best val f1-macro = 0.893, test f1-macro = 0.889\n",
      "time duration = 152.350, best val f1-macro = 0.891, test f1-macro = 0.886\n",
      "time duration = 55.727, best val f1-macro = 0.895, test f1-macro = 0.873\n",
      "time duration = 57.651, best val f1-macro = 0.894, test f1-macro = 0.888\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "time duration = 55.965, best val f1-macro = 0.900, test f1-macro = 0.884\n",
      "time duration = 56.418, best val f1-macro = 0.898, test f1-macro = 0.889\n",
      "time duration = 56.699, best val f1-macro = 0.900, test f1-macro = 0.886\n",
      "time duration = 56.916, best val f1-macro = 0.897, test f1-macro = 0.891\n",
      "time duration = 68.026, best val f1-macro = 0.895, test f1-macro = 0.893\n",
      "time duration = 73.483, best val f1-macro = 0.897, test f1-macro = 0.892\n",
      "time duration = 57.183, best val f1-macro = 0.909, test f1-macro = 0.889\n",
      "time duration = 67.226, best val f1-macro = 0.892, test f1-macro = 0.890\n",
      "time duration = 56.006, best val f1-macro = 0.905, test f1-macro = 0.891\n",
      "time duration = 56.261, best val f1-macro = 0.893, test f1-macro = 0.883\n",
      "time duration = 67.256, best val f1-macro = 0.895, test f1-macro = 0.890\n",
      "time duration = 80.429, best val f1-macro = 0.895, test f1-macro = 0.890\n",
      "time duration = 99.252, best val f1-macro = 0.895, test f1-macro = 0.891\n",
      "time duration = 55.822, best val f1-macro = 0.892, test f1-macro = 0.882\n",
      "time duration = 58.392, best val f1-macro = 0.898, test f1-macro = 0.888\n",
      "time duration = 60.713, best val f1-macro = 0.898, test f1-macro = 0.889\n",
      "time duration = 57.675, best val f1-macro = 0.894, test f1-macro = 0.891\n",
      "time duration = 96.861, best val f1-macro = 0.893, test f1-macro = 0.884\n",
      "time duration = 56.495, best val f1-macro = 0.900, test f1-macro = 0.889\n",
      "time duration = 56.350, best val f1-macro = 0.893, test f1-macro = 0.891\n",
      "time duration = 84.921, best val f1-macro = 0.891, test f1-macro = 0.886\n",
      "time duration = 55.718, best val f1-macro = 0.893, test f1-macro = 0.885\n",
      "test f1-macro (mean, std):  0.8881066541905086 0.004265913012365632\n",
      "test f1-macro (mean, std) after filter:  0.8884680069014183 0.0024311654939080177\n",
      "\n",
      "start testing on Coauthor-CS dataset with random split: 1\n",
      "time duration = 58.807, best val f1-macro = 0.918, test f1-macro = 0.889\n",
      "time duration = 119.218, best val f1-macro = 0.914, test f1-macro = 0.883\n",
      "time duration = 101.501, best val f1-macro = 0.916, test f1-macro = 0.879\n",
      "time duration = 57.611, best val f1-macro = 0.913, test f1-macro = 0.885\n",
      "time duration = 61.888, best val f1-macro = 0.918, test f1-macro = 0.884\n",
      "time duration = 63.004, best val f1-macro = 0.927, test f1-macro = 0.886\n",
      "time duration = 63.712, best val f1-macro = 0.916, test f1-macro = 0.886\n",
      "time duration = 58.703, best val f1-macro = 0.916, test f1-macro = 0.886\n",
      "time duration = 155.662, best val f1-macro = 0.916, test f1-macro = 0.885\n",
      "time duration = 60.377, best val f1-macro = 0.918, test f1-macro = 0.888\n",
      "time duration = 63.880, best val f1-macro = 0.921, test f1-macro = 0.891\n",
      "time duration = 72.525, best val f1-macro = 0.916, test f1-macro = 0.882\n",
      "time duration = 85.403, best val f1-macro = 0.907, test f1-macro = 0.881\n",
      "time duration = 70.579, best val f1-macro = 0.911, test f1-macro = 0.882\n",
      "time duration = 62.070, best val f1-macro = 0.914, test f1-macro = 0.886\n",
      "time duration = 69.107, best val f1-macro = 0.913, test f1-macro = 0.886\n",
      "time duration = 63.999, best val f1-macro = 0.922, test f1-macro = 0.882\n",
      "time duration = 65.002, best val f1-macro = 0.909, test f1-macro = 0.889\n",
      "time duration = 60.844, best val f1-macro = 0.911, test f1-macro = 0.886\n",
      "time duration = 68.413, best val f1-macro = 0.914, test f1-macro = 0.881\n",
      "time duration = 62.681, best val f1-macro = 0.918, test f1-macro = 0.887\n",
      "time duration = 63.677, best val f1-macro = 0.920, test f1-macro = 0.885\n",
      "time duration = 67.184, best val f1-macro = 0.922, test f1-macro = 0.885\n",
      "time duration = 64.983, best val f1-macro = 0.918, test f1-macro = 0.881\n",
      "time duration = 159.044, best val f1-macro = 0.913, test f1-macro = 0.885\n",
      "time duration = 60.024, best val f1-macro = 0.914, test f1-macro = 0.884\n",
      "time duration = 68.818, best val f1-macro = 0.918, test f1-macro = 0.886\n",
      "time duration = 93.169, best val f1-macro = 0.914, test f1-macro = 0.884\n",
      "time duration = 57.740, best val f1-macro = 0.914, test f1-macro = 0.886\n",
      "time duration = 120.558, best val f1-macro = 0.922, test f1-macro = 0.887\n",
      "test f1-macro (mean, std):  0.884895188011479 0.002597146964445374\n",
      "test f1-macro (mean, std) after filter:  0.8848978247700773 0.0016634144722311587\n",
      "\n",
      "start testing on Coauthor-CS dataset with random split: 2\n",
      "time duration = 145.278, best val f1-macro = 0.901, test f1-macro = 0.879\n",
      "time duration = 58.072, best val f1-macro = 0.906, test f1-macro = 0.885\n",
      "time duration = 185.984, best val f1-macro = 0.908, test f1-macro = 0.885\n",
      "time duration = 99.271, best val f1-macro = 0.905, test f1-macro = 0.885\n",
      "time duration = 133.107, best val f1-macro = 0.903, test f1-macro = 0.880\n",
      "time duration = 66.094, best val f1-macro = 0.904, test f1-macro = 0.882\n",
      "time duration = 126.438, best val f1-macro = 0.907, test f1-macro = 0.872\n",
      "time duration = 79.710, best val f1-macro = 0.905, test f1-macro = 0.882\n",
      "time duration = 72.164, best val f1-macro = 0.901, test f1-macro = 0.880\n",
      "time duration = 133.354, best val f1-macro = 0.910, test f1-macro = 0.879\n",
      "time duration = 78.897, best val f1-macro = 0.908, test f1-macro = 0.883\n",
      "time duration = 73.208, best val f1-macro = 0.905, test f1-macro = 0.885\n",
      "time duration = 116.206, best val f1-macro = 0.901, test f1-macro = 0.874\n",
      "time duration = 94.861, best val f1-macro = 0.905, test f1-macro = 0.883\n",
      "time duration = 78.592, best val f1-macro = 0.896, test f1-macro = 0.881\n",
      "time duration = 143.914, best val f1-macro = 0.901, test f1-macro = 0.878\n",
      "time duration = 156.093, best val f1-macro = 0.904, test f1-macro = 0.877\n",
      "time duration = 90.398, best val f1-macro = 0.907, test f1-macro = 0.881\n",
      "time duration = 66.573, best val f1-macro = 0.908, test f1-macro = 0.886\n",
      "time duration = 58.116, best val f1-macro = 0.904, test f1-macro = 0.886\n",
      "time duration = 87.610, best val f1-macro = 0.904, test f1-macro = 0.881\n",
      "time duration = 82.625, best val f1-macro = 0.912, test f1-macro = 0.883\n",
      "time duration = 108.561, best val f1-macro = 0.906, test f1-macro = 0.876\n",
      "time duration = 80.984, best val f1-macro = 0.901, test f1-macro = 0.882\n",
      "time duration = 63.714, best val f1-macro = 0.906, test f1-macro = 0.878\n",
      "time duration = 67.758, best val f1-macro = 0.908, test f1-macro = 0.884\n",
      "time duration = 77.808, best val f1-macro = 0.904, test f1-macro = 0.884\n",
      "time duration = 129.263, best val f1-macro = 0.907, test f1-macro = 0.881\n",
      "time duration = 70.969, best val f1-macro = 0.901, test f1-macro = 0.882\n",
      "time duration = 131.238, best val f1-macro = 0.907, test f1-macro = 0.879\n",
      "test f1-macro (mean, std):  0.8810447539653729 0.003389473875540811\n",
      "test f1-macro (mean, std) after filter:  0.8813516773319495 0.002211650191215212\n"
     ]
    }
   ],
   "source": [
    "accs = []\n",
    "datasets = ['Cora', 'Citeseer', 'Pubmed', 'Coauthor-CS']\n",
    "for dataset in datasets:\n",
    "    args.data = dataset\n",
    "    if dataset == 'Cora':\n",
    "        print('\\nstart testing on ' + dataset + ' dataset')\n",
    "        accs.append(main(args))\n",
    "    elif dataset == 'Citeseer':\n",
    "        print('\\nstart testing on ' + dataset + ' dataset')\n",
    "        accs.append(main(args))\n",
    "    elif dataset == 'Pubmed':\n",
    "        print('\\nstart testing on ' + dataset + ' dataset')\n",
    "        accs.append(main(args))\n",
    "    elif dataset == 'Coauthor-CS':\n",
    "        for i in range(3):\n",
    "            print('\\nstart testing on ' + dataset + ' dataset with random split: ' + str(i))\n",
    "            args.test_id = i\n",
    "            accs.append(main(args))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "accs = np.array(accs)\n",
    "np.savetxt('log_f1_macro/f1-macro_TreeLSTM_hop2.txt',accs)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
