{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_graph = []\n",
    "test_fact = []\n",
    "G1 = set()\n",
    "G2 = set()\n",
    "#../../GraIL-BM_fb237_v2/test/\n",
    "dataset = '.'\n",
    "relations_TG1 = set()\n",
    "relations_TG2 = set()\n",
    "relations_G1 = set()\n",
    "relations_G2 = set()\n",
    "for line in open('{}/test-graph.txt'.format(dataset)):\n",
    "    t = line.strip().split('\\t')\n",
    "    if t[1] != '<http://www.w3.org/1999/02/22-rdf-syntax-ns#type>':\n",
    "        test_graph.append(t)\n",
    "        if (t[0], t[1], t[2]) not in G1:\n",
    "            G1.add((t[0], t[1], t[2]))\n",
    "        if (t[0], t[1], t[2]) not in G2:\n",
    "            G2.add((t[0], t[1], t[2]))\n",
    "    if t[1] != '<http://www.w3.org/1999/02/22-rdf-syntax-ns#type>':\n",
    "        relations_TG1.add(t[1])\n",
    "        relations_G1.add(t[1])\n",
    "        relations_G2.add(t[1])\n",
    "for line in open('{}/test-fact.txt'.format(dataset)):\n",
    "    t = line.strip().split('\\t')\n",
    "    if t[1] != '<http://www.w3.org/1999/02/22-rdf-syntax-ns#type>':\n",
    "        test_fact.append(t)\n",
    "        if (t[0], t[1], t[2]) not in G2:\n",
    "            G2.add((t[0], t[1], t[2]))\n",
    "    if t[1] != '<http://www.w3.org/1999/02/22-rdf-syntax-ns#type>':\n",
    "        relations_TG2.add(t[1])\n",
    "        relations_G2.add(t[1])\n",
    "relations_TG1 = list(relations_TG1)\n",
    "relations_TG2 = list(relations_TG2)\n",
    "relations_G1 = list(relations_G1)\n",
    "relations_G2 = list(relations_G2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "pairs_for_relation_G1 = dict([(i,set()) for i in relations_G1])\n",
    "pairs_for_relation_G2 = dict([(i,set()) for i in relations_G2])\n",
    "for t in G1:\n",
    "    pairs_for_relation_G1[t[1]].add((t[0],t[2]))\n",
    "for t in G2:\n",
    "    pairs_for_relation_G2[t[1]].add((t[0],t[2]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "# subsumption of relations: R(x,y) --> S(x,y) confidence_subsumption[i][j] = j->i\n",
    "import numpy as np\n",
    "f = open('pattern1.txt',\"w+\")\n",
    "confidence_subsumption = np.zeros((len(relations_TG2), len(relations_TG1)))\n",
    "for i in range(len(relations_TG2)):\n",
    "    #print('\\rchecking {}-th relation'.format(str(i)),end='')\n",
    "    s = relations_TG2[i]\n",
    "    for j in range(len(relations_TG1)):\n",
    "        r = relations_TG1[j]\n",
    "        if s != r:\n",
    "            #computing N\n",
    "            N = len(pairs_for_relation_G1[r])\n",
    "            #print(pairs_for_relation_G1[r]) \n",
    "            M = 0\n",
    "            for pair in pairs_for_relation_G1[r]:\n",
    "                if pair in pairs_for_relation_G2[s]:\n",
    "                    M += 1\n",
    "\n",
    "            confidence_subsumption[i][j] = M / N\n",
    "            if confidence_subsumption[i][j] >= 0.2:\n",
    "                #print(r, s)\n",
    "                #print(M/N)\n",
    "                f.write('{}\\t{}\\t{}\\n'.format(str(M/N), r, s))\n",
    "f.close()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "checking 122-th relation0.3212590217590332\n",
      "concept:agentcreated concept:agentcreated\n",
      "1.0\n",
      "concept:stateorprovinceisborderedbystateorprovince concept:stateorprovinceisborderedbystateorprovince\n",
      "1.0\n"
     ]
    }
   ],
   "source": [
    "# transive relations: R(x,y), R(y,z) -> R(x,z) confidence_subsumption[i][i] = i -> i\n",
    "def compute_N(relation, G):\n",
    "    curr_N = 0\n",
    "    curr_XZ = set()\n",
    "    for p1 in pairs_for_relation_G1[relation]:\n",
    "        for p2 in pairs_for_relation_G1[relation]:\n",
    "            if p1 != p2:\n",
    "                if p1[1] == p2[0]:\n",
    "                    if (p1[0], p2[1]) not in curr_XZ:\n",
    "                        curr_N += 1\n",
    "                        curr_XZ.add((p1[0], p2[1]))\n",
    "    return curr_N, curr_XZ\n",
    "\n",
    "import time\n",
    "time1 = time.time()\n",
    "N_for_r = dict([(i,0) for i in relations_TG1])\n",
    "XZ_for_r = dict([(i,set()) for i in relations_TG1])\n",
    "i = 0 \n",
    "for r in relations_TG1:\n",
    "    i += 1\n",
    "    print('\\rchecking {}-th relation'.format(str(i)),end='')\n",
    "    N, XZ = compute_N(r, G1)\n",
    "    N_for_r[r] = N\n",
    "    XZ_for_r[r] = XZ\n",
    "print(time.time() - time1)\n",
    "\n",
    "# transive relations: R(x,y), R(y,z) -> R(x,z) confidence_subsumption[i][i] = i -> i\n",
    "import numpy as np\n",
    "f = open('pattern2.txt',\"w+\")\n",
    "confidence_subsumption = np.zeros((len(relations_TG2), len(relations_TG1)))\n",
    "for i in range(len(relations_TG2)):\n",
    "    #print('\\rchecking {}-th relation'.format(str(i)),end='')\n",
    "    s = relations_TG2[i]\n",
    "    for j in range(len(relations_TG1)):\n",
    "        r = relations_TG1[j]\n",
    "        if r == s:\n",
    "            #computing N\n",
    "            N = N_for_r[r]\n",
    "            XZ = XZ_for_r[r]\n",
    "            #print(pairs_for_relation_G1[r]) \n",
    "            M = 0\n",
    "            for pair in pairs_for_relation_G2[r]:\n",
    "                if pair in XZ:\n",
    "                    M += 1\n",
    "            if N == 0:\n",
    "                continue\n",
    "            confidence_subsumption[i][j] = M / N\n",
    "            \n",
    "            if confidence_subsumption[i][j] >= 0.5:\n",
    "                print(r, s)\n",
    "                print(M/N)\n",
    "                f.write('{}\\t{}\\t{}\\n'.format(str(M/N), r, s))\n",
    "f.close()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "# R(x,y) -> R(y,x)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "concept:mammalsuchasmammal\n",
      "0.7083333333333334\n",
      "concept:teamplaysagainstteam\n",
      "0.7717149220489977\n",
      "concept:competeswith\n",
      "0.7637795275590551\n",
      "concept:personalsoknownas\n",
      "1.0\n",
      "concept:arthropodcalledarthropod\n",
      "0.6351351351351351\n",
      "concept:animalsuchasinsect\n",
      "0.6255924170616114\n",
      "concept:animalpreyson\n",
      "0.5643835616438356\n",
      "concept:countryalsoknownas\n",
      "0.8950276243093923\n",
      "concept:agentcompeteswithagent\n",
      "0.5751633986928104\n",
      "concept:arthropodandotherarthropod\n",
      "0.6230366492146597\n",
      "concept:riveremptiesintoriver\n",
      "0.5\n"
     ]
    }
   ],
   "source": [
    "f = open('pattern3.txt',\"w+\")\n",
    "for i in range(len(relations_TG2)):\n",
    "    #print('\\rchecking {}-th relation'.format(str(i)),end='')\n",
    "    s = relations_TG2[i]\n",
    "    for j in range(len(relations_TG1)):\n",
    "        r = relations_TG1[j]\n",
    "        if s == r:\n",
    "            N = len(pairs_for_relation_G1[r])\n",
    "            #print(pairs_for_relation_G1[r]) \n",
    "            M = 0\n",
    "            for pair in pairs_for_relation_G1[r]:\n",
    "                if (pair[1], pair[0]) in pairs_for_relation_G2[s]:\n",
    "                    M += 1\n",
    "\n",
    "            confidence = M / N\n",
    "            if confidence >= 0.5:\n",
    "                print(r)\n",
    "                print(M/N)\n",
    "                f.write('{}\\t{}\\n'.format(str(confidence), r))\n",
    "f.close()            "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "checking 122-th relation5.008680820465088\n"
     ]
    }
   ],
   "source": [
    "rs_list = []\n",
    "for r in relations_TG1:\n",
    "    for s in relations_TG1:\n",
    "        rs_list.append((r,s))\n",
    "def compute_N_for_rs(r, s, G):\n",
    "    curr_N = 0\n",
    "    curr_XZ = set()\n",
    "    for p1 in pairs_for_relation_G1[r]:\n",
    "        for p2 in pairs_for_relation_G1[s]:\n",
    "            if p1[1] == p2[0]:\n",
    "                if (p1[0], p2[1]) not in curr_XZ:\n",
    "                    curr_N += 1\n",
    "                    curr_XZ.add((p1[0], p2[1]))\n",
    "    return curr_N, curr_XZ\n",
    "\n",
    "import time\n",
    "time1 = time.time()\n",
    "N_for_rs = dict([(i,0) for i in rs_list])\n",
    "XZ_for_rs = dict([(i,set()) for i in rs_list])\n",
    "i = 0 \n",
    "for r in relations_TG1:\n",
    "    i += 1\n",
    "    print('\\rchecking {}-th relation'.format(str(i)),end='')\n",
    "    for s in relations_TG1:\n",
    "        N, XZ = compute_N_for_rs(r, s, G1)\n",
    "        N_for_rs[(r,s)] = N\n",
    "        XZ_for_rs[(r,s)] = XZ\n",
    "print(time.time() - time1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "checking 86-th relation"
     ]
    }
   ],
   "source": [
    "# chains: R(x,y), S(y,z) -> T(x,z) \n",
    "import numpy as np\n",
    "f = open('pattern4',\"w+\")\n",
    "#confidence_subsumption = np.zeros((len(relations_TG2), len(relations_TG1)))\n",
    "for i in range(len(relations_TG2)):\n",
    "    print('\\rchecking {}-th relation'.format(str(i)),end='')\n",
    "    t = relations_TG2[i]\n",
    "    for j in range(len(relations_TG1)):\n",
    "        r = relations_TG1[j]\n",
    "        for k in range(len(relations_TG1)):\n",
    "            s = relations_TG1[k]\n",
    "            if r !=s and s!=t and r!=t:\n",
    "                #computing N\n",
    "                N = N_for_rs[(r,s)]\n",
    "                XZ = XZ_for_rs[(r,s)]\n",
    "                #print(pairs_for_relation_G1[r]) \n",
    "                M = 0\n",
    "                for pair in pairs_for_relation_G2[t]:\n",
    "                    if pair in XZ:\n",
    "                        M += 1\n",
    "                if N == 0:\n",
    "                    continue\n",
    "                confidence_subsumption[i][j] = M / N\n",
    "\n",
    "                if confidence_subsumption[i][j] >= 0.5:\n",
    "                    #print(s, r, t)\n",
    "                    #print(M/N)\n",
    "                    f.write('{}\\t{}\\t{}\\t{}\\n'.format(str(M/N), s,r,t))\n",
    "f.close()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "checking 122-th relation4.909570693969727\n"
     ]
    }
   ],
   "source": [
    "rs_list = []\n",
    "for r in relations_TG1:\n",
    "    for s in relations_TG1:\n",
    "        rs_list.append((r,s))\n",
    "def compute_N_for_rs_same(r, s, G):\n",
    "    curr_N = 0\n",
    "    curr_XY = set()\n",
    "    for p1 in pairs_for_relation_G1[r]:\n",
    "        for p2 in pairs_for_relation_G1[s]:\n",
    "            if p1[0] == p2[0]:\n",
    "                if p1[1] == p2[1]:\n",
    "                    if (p1[0], p1[1]) not in curr_XY:\n",
    "                        curr_N += 1\n",
    "                        curr_XY.add((p1[0], p1[1]))\n",
    "    return curr_N, curr_XY\n",
    "\n",
    "import time\n",
    "time1 = time.time()\n",
    "N_for_rs_same = dict([(i,0) for i in rs_list])\n",
    "XY_for_rs_same = dict([(i,set()) for i in rs_list])\n",
    "i = 0 \n",
    "for r in relations_TG1:\n",
    "    i += 1\n",
    "    print('\\rchecking {}-th relation'.format(str(i)),end='')\n",
    "    for s in relations_TG1:\n",
    "        N, XY = compute_N_for_rs_same(r, s, G1)\n",
    "        N_for_rs_same[(r,s)] = N\n",
    "        XY_for_rs_same[(r,s)] = XY\n",
    "print(time.time() - time1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "concept:synonymfor concept:animalsuchasinsect concept:arthropodcalledarthropod\n",
      "1.0\n",
      "concept:animalsuchasinsect concept:synonymfor concept:arthropodcalledarthropod\n",
      "1.0\n",
      "concept:animalthatfeedoninsect concept:synonymfor concept:arthropodcalledarthropod\n",
      "1.0\n",
      "concept:arthropodandotherarthropod concept:agentcompeteswithagent concept:arthropodcalledarthropod\n",
      "0.8333333333333334\n",
      "concept:agentcompeteswithagent concept:arthropodandotherarthropod concept:arthropodcalledarthropod\n",
      "0.8333333333333334\n",
      "concept:animalthatfeedoninsect concept:arthropodandotherarthropod concept:arthropodcalledarthropod\n",
      "0.5735294117647058\n",
      "concept:synonymfor concept:animalthatfeedoninsect concept:arthropodcalledarthropod\n",
      "1.0\n",
      "concept:arthropodandotherarthropod concept:animalthatfeedoninsect concept:arthropodcalledarthropod\n",
      "0.5735294117647058\n",
      "concept:mutualproxyfor concept:subpartof concept:atlocation\n",
      "0.6666666666666666\n",
      "concept:subpartof concept:mutualproxyfor concept:atlocation\n",
      "0.6666666666666666\n",
      "concept:synonymfor concept:arthropodcalledarthropod concept:animalsuchasinsect\n",
      "1.0\n",
      "concept:arthropodandotherarthropod concept:arthropodcalledarthropod concept:animalsuchasinsect\n",
      "0.6575342465753424\n",
      "concept:animalthatfeedoninsect concept:arthropodcalledarthropod concept:animalsuchasinsect\n",
      "0.9347826086956522\n",
      "concept:arthropodandotherarthropod concept:animalpreyson concept:animalsuchasinsect\n",
      "0.5238095238095238\n",
      "concept:arthropodcalledarthropod concept:synonymfor concept:animalsuchasinsect\n",
      "1.0\n",
      "concept:animalthatfeedoninsect concept:synonymfor concept:animalsuchasinsect\n",
      "1.0\n",
      "concept:arthropodcalledarthropod concept:arthropodandotherarthropod concept:animalsuchasinsect\n",
      "0.6575342465753424\n",
      "concept:animalpreyson concept:arthropodandotherarthropod concept:animalsuchasinsect\n",
      "0.5238095238095238\n",
      "concept:animalthatfeedoninsect concept:arthropodandotherarthropod concept:animalsuchasinsect\n",
      "0.8823529411764706\n",
      "concept:arthropodcalledarthropod concept:animalthatfeedoninsect concept:animalsuchasinsect\n",
      "0.9347826086956522\n",
      "concept:synonymfor concept:animalthatfeedoninsect concept:animalsuchasinsect\n",
      "1.0\n",
      "concept:arthropodandotherarthropod concept:animalthatfeedoninsect concept:animalsuchasinsect\n",
      "0.8823529411764706\n",
      "concept:animalsuchasinsect concept:specializationof concept:animalpreyson\n",
      "1.0\n",
      "concept:specializationof concept:animalsuchasinsect concept:animalpreyson\n",
      "1.0\n",
      "concept:animalsuchasinvertebrate concept:animalistypeofanimal concept:animalpreyson\n",
      "0.7142857142857143\n",
      "concept:animalistypeofanimal concept:animalsuchasinvertebrate concept:animalpreyson\n",
      "0.7142857142857143\n",
      "concept:athleteplaysforteam concept:worksfor concept:coachesteam\n",
      "1.0\n",
      "concept:worksfor concept:athleteplaysforteam concept:coachesteam\n",
      "1.0\n",
      "concept:animalpreyson concept:mammalsuchasmammal concept:animalistypeofanimal\n",
      "1.0\n",
      "concept:animalpreyson concept:specializationof concept:animalistypeofanimal\n",
      "0.7692307692307693\n",
      "concept:mammalsuchasmammal concept:animalpreyson concept:animalistypeofanimal\n",
      "1.0\n",
      "concept:specializationof concept:animalpreyson concept:animalistypeofanimal\n",
      "0.7692307692307693\n",
      "concept:mutualproxyfor concept:atlocation concept:subpartof\n",
      "1.0\n",
      "concept:proxyfor concept:atlocation concept:subpartof\n",
      "1.0\n",
      "concept:locationlocatedwithinlocation concept:citylocatedincountry concept:subpartof\n",
      "1.0\n",
      "concept:proxyfor concept:citylocatedincountry concept:subpartof\n",
      "1.0\n",
      "concept:atlocation concept:mutualproxyfor concept:subpartof\n",
      "1.0\n",
      "concept:citylocatedincountry concept:locationlocatedwithinlocation concept:subpartof\n",
      "1.0\n",
      "concept:atlocation concept:proxyfor concept:subpartof\n",
      "1.0\n",
      "concept:citylocatedincountry concept:proxyfor concept:subpartof\n",
      "1.0\n",
      "concept:proxyfor concept:personleadsorganization concept:worksfor\n",
      "1.0\n",
      "concept:athleteplaysforteam concept:coachesteam concept:worksfor\n",
      "1.0\n",
      "concept:athleteledsportsteam concept:coachesteam concept:worksfor\n",
      "1.0\n",
      "concept:personleadsgeopoliticalorganization concept:personhasresidenceingeopoliticallocation concept:worksfor\n",
      "1.0\n",
      "concept:personhasresidenceingeopoliticallocation concept:personleadsgeopoliticalorganization concept:worksfor\n",
      "1.0\n",
      "concept:coachesteam concept:athleteplaysforteam concept:worksfor\n",
      "1.0\n",
      "concept:personleadsorganization concept:proxyfor concept:worksfor\n",
      "1.0\n",
      "concept:coachesteam concept:athleteledsportsteam concept:worksfor\n",
      "1.0\n",
      "concept:animalsuchasinvertebrate concept:specializationof concept:agentcompeteswithagent\n",
      "1.0\n",
      "concept:specializationof concept:animalsuchasinvertebrate concept:agentcompeteswithagent\n",
      "1.0\n",
      "concept:organizationheadquarteredincity concept:newspaperincity concept:headquarteredin\n",
      "1.0\n",
      "concept:newspaperincity concept:organizationheadquarteredincity concept:headquarteredin\n",
      "1.0\n",
      "concept:animalsuchasinsect concept:arthropodcalledarthropod concept:arthropodandotherarthropod\n",
      "0.9090909090909091\n",
      "concept:synonymfor concept:arthropodcalledarthropod concept:arthropodandotherarthropod\n",
      "1.0\n",
      "concept:agentcompeteswithagent concept:arthropodcalledarthropod concept:arthropodandotherarthropod\n",
      "0.8333333333333334\n",
      "concept:animalthatfeedoninsect concept:arthropodcalledarthropod concept:arthropodandotherarthropod\n",
      "0.8913043478260869\n",
      "concept:arthropodcalledarthropod concept:animalsuchasinsect concept:arthropodandotherarthropod\n",
      "0.9090909090909091\n",
      "concept:animalpreyson concept:animalsuchasinsect concept:arthropodandotherarthropod\n",
      "0.65\n",
      "concept:synonymfor concept:animalsuchasinsect concept:arthropodandotherarthropod\n",
      "1.0\n",
      "concept:animalsuchasinvertebrate concept:animalsuchasinsect concept:arthropodandotherarthropod\n",
      "0.6363636363636364\n",
      "concept:animalthatfeedoninsect concept:animalsuchasinsect concept:arthropodandotherarthropod\n",
      "0.6310679611650486\n",
      "concept:animalsuchasinsect concept:animalpreyson concept:arthropodandotherarthropod\n",
      "0.65\n",
      "concept:arthropodcalledarthropod concept:synonymfor concept:arthropodandotherarthropod\n",
      "1.0\n",
      "concept:animalsuchasinsect concept:synonymfor concept:arthropodandotherarthropod\n",
      "1.0\n",
      "concept:animalthatfeedoninsect concept:synonymfor concept:arthropodandotherarthropod\n",
      "1.0\n",
      "concept:arthropodcalledarthropod concept:agentcompeteswithagent concept:arthropodandotherarthropod\n",
      "0.8333333333333334\n",
      "concept:animalsuchasinsect concept:animalsuchasinvertebrate concept:arthropodandotherarthropod\n",
      "0.6363636363636364\n",
      "concept:animalthatfeedoninsect concept:animalsuchasinvertebrate concept:arthropodandotherarthropod\n",
      "1.0\n",
      "concept:arthropodcalledarthropod concept:animalthatfeedoninsect concept:arthropodandotherarthropod\n",
      "0.8913043478260869\n",
      "concept:animalsuchasinsect concept:animalthatfeedoninsect concept:arthropodandotherarthropod\n",
      "0.6310679611650486\n",
      "concept:synonymfor concept:animalthatfeedoninsect concept:arthropodandotherarthropod\n",
      "1.0\n",
      "concept:animalsuchasinvertebrate concept:animalthatfeedoninsect concept:arthropodandotherarthropod\n",
      "1.0\n",
      "concept:subpartof concept:citylocatedincountry concept:citylocatedingeopoliticallocation\n",
      "1.0\n",
      "concept:locationlocatedwithinlocation concept:citylocatedincountry concept:citylocatedingeopoliticallocation\n",
      "1.0\n",
      "concept:proxyfor concept:citylocatedincountry concept:citylocatedingeopoliticallocation\n",
      "1.0\n",
      "concept:citylocatedincountry concept:subpartof concept:citylocatedingeopoliticallocation\n",
      "1.0\n",
      "concept:citylocatedincountry concept:locationlocatedwithinlocation concept:citylocatedingeopoliticallocation\n",
      "1.0\n",
      "concept:citylocatedincountry concept:proxyfor concept:citylocatedingeopoliticallocation\n",
      "1.0\n",
      "concept:agentbelongstoorganization concept:agentcontrols concept:agentcollaborateswithagent\n",
      "1.0\n",
      "concept:agentcontrols concept:agentbelongstoorganization concept:agentcollaborateswithagent\n",
      "1.0\n",
      "concept:animalsuchasinsect concept:arthropodcalledarthropod concept:animalthatfeedoninsect\n",
      "0.7454545454545455\n",
      "concept:synonymfor concept:arthropodcalledarthropod concept:animalthatfeedoninsect\n",
      "1.0\n",
      "concept:arthropodandotherarthropod concept:arthropodcalledarthropod concept:animalthatfeedoninsect\n",
      "0.5342465753424658\n",
      "concept:arthropodcalledarthropod concept:animalsuchasinsect concept:animalthatfeedoninsect\n",
      "0.7454545454545455\n",
      "concept:synonymfor concept:animalsuchasinsect concept:animalthatfeedoninsect\n",
      "1.0\n",
      "concept:arthropodandotherarthropod concept:animalsuchasinsect concept:animalthatfeedoninsect\n",
      "0.57\n",
      "concept:arthropodcalledarthropod concept:synonymfor concept:animalthatfeedoninsect\n",
      "1.0\n",
      "concept:animalsuchasinsect concept:synonymfor concept:animalthatfeedoninsect\n",
      "1.0\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "concept:arthropodcalledarthropod concept:arthropodandotherarthropod concept:animalthatfeedoninsect\n",
      "0.5342465753424658\n",
      "concept:animalsuchasinsect concept:arthropodandotherarthropod concept:animalthatfeedoninsect\n",
      "0.57\n",
      "concept:subpartof concept:citylocatedincountry concept:locationlocatedwithinlocation\n",
      "1.0\n",
      "concept:proxyfor concept:citylocatedincountry concept:locationlocatedwithinlocation\n",
      "1.0\n",
      "concept:citylocatedincountry concept:subpartof concept:locationlocatedwithinlocation\n",
      "1.0\n",
      "concept:citylocatedincountry concept:proxyfor concept:locationlocatedwithinlocation\n",
      "1.0\n",
      "concept:agentcollaborateswithagent concept:mutualproxyfor concept:agentcontrols\n",
      "1.0\n",
      "concept:mutualproxyfor concept:agentcollaborateswithagent concept:agentcontrols\n",
      "1.0\n",
      "concept:agentbelongstoorganization concept:agentcollaborateswithagent concept:agentcontrols\n",
      "1.0\n",
      "concept:agentcollaborateswithagent concept:agentbelongstoorganization concept:agentcontrols\n",
      "1.0\n",
      "concept:subpartof concept:citylocatedincountry concept:proxyfor\n",
      "1.0\n",
      "concept:locationlocatedwithinlocation concept:citylocatedincountry concept:proxyfor\n",
      "1.0\n",
      "concept:citylocatedincountry concept:subpartof concept:proxyfor\n",
      "1.0\n",
      "concept:locationlocatedwithinlocation concept:subpartof concept:proxyfor\n",
      "1.0\n",
      "concept:citylocatedincountry concept:locationlocatedwithinlocation concept:proxyfor\n",
      "1.0\n",
      "concept:subpartof concept:locationlocatedwithinlocation concept:proxyfor\n",
      "1.0\n"
     ]
    }
   ],
   "source": [
    "#R(x,y) , S(x,y) -> T(x,y)\n",
    "f = open('pattern5.txt',\"w+\")\n",
    "#confidence_subsumption = np.zeros((len(relations_TG2), len(relations_TG1)))\n",
    "for i in range(len(relations_TG2)):\n",
    "    #print('\\rchecking {}-th relation'.format(str(i)),end='')\n",
    "    t = relations_TG2[i]\n",
    "    for j in range(len(relations_TG1)):\n",
    "        r = relations_TG1[j]\n",
    "        for k in range(len(relations_TG1)):\n",
    "            \n",
    "                s = relations_TG1[k]\n",
    "                if s !=r and s != t and r != t:\n",
    "                    N = N_for_rs_same[(r,s)]\n",
    "                    XY = XY_for_rs_same[(r,s)]\n",
    "                    M = 0\n",
    "                    for pair in pairs_for_relation_G2[t]:\n",
    "                        if pair in XY:\n",
    "                            M += 1\n",
    "                        #print(pair)\n",
    "                    if N == 0:\n",
    "                        continue\n",
    "                    confidence_subsumption[i][j] = M / N\n",
    "\n",
    "                    if confidence_subsumption[i][j] > 0.5:\n",
    "                        print(s, r, t)\n",
    "                        print(M/N)\n",
    "                        f.write('{}\\t{}\\t{}\\t{}\\n'.format(str(M/N), s,r,t))\n",
    "f.close()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "types_G1 = set()\n",
    "types_G2 = set()\n",
    "types_TG1 = set()\n",
    "types_TG2 = set()\n",
    "G1_type_triples = set()\n",
    "G2_type_triples = set()\n",
    "for line in open('{}/test-graph.txt'.format(dataset)):\n",
    "    t = line.strip().split('\\t')\n",
    "    if t[1] == '<http://www.w3.org/1999/02/22-rdf-syntax-ns#type>':\n",
    "        types_G1.add(t[2])\n",
    "        #types_G2.add(t[2])\n",
    "        types_TG1.add(t[2])\n",
    "        G1_type_triples.add((t[0], t[1], t[2]))\n",
    "        #G2_type_triples.add((t[0], t[1], t[2]))\n",
    "for line in open('{}/test-fact.txt'.format(dataset)):\n",
    "    t = line.strip().split('\\t')\n",
    "    if t[1] == '<http://www.w3.org/1999/02/22-rdf-syntax-ns#type>':\n",
    "        types_G2.add(t[2])\n",
    "        types_TG2.add(t[2])\n",
    "        G2_type_triples.add((t[0], t[1], t[2]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "# A(x) -> B(x)\n",
    "#Type(a, A) -> Type(a, B)\n",
    "f = open('pattern6.txt',\"w+\")\n",
    "entities_for_type_G1 = dict([(i,set()) for i in types_G1])\n",
    "for t in G1_type_triples:\n",
    "    if t[1] == '<http://www.w3.org/1999/02/22-rdf-syntax-ns#type>':\n",
    "        entities_for_type_G1[t[2]].add(t[0])\n",
    "entities_for_type_G2 = dict([(i,set()) for i in types_G2])\n",
    "for t in G2_type_triples:\n",
    "    if t[1] == '<http://www.w3.org/1999/02/22-rdf-syntax-ns#type>':\n",
    "        entities_for_type_G2[t[2]].add(t[0])   \n",
    "for b in types_TG2:\n",
    "    \n",
    "    for a in types_TG1:\n",
    "        if a != b:\n",
    "            M = 0\n",
    "            N = len(entities_for_type_G1[a])\n",
    "            for entity in entities_for_type_G2[b]:\n",
    "                if entity in entities_for_type_G1[a]:\n",
    "                    M += 1\n",
    "            if N == 0:\n",
    "                    continue\n",
    "            if M/N > 0.5:\n",
    "                f.write('{}\\t{}\\t{}\\n'.format(str(M/N), a,b))\n",
    "f.close()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "# A1(x), A2(x) -> B(x)\n",
    "#Type(a, A) -> Type(a, B)\n",
    "f = open('pattern7.txt',\"w+\")\n",
    "entities_for_type_G1 = dict([(i,set()) for i in types_G1])\n",
    "for t in G1_type_triples:\n",
    "    if t[1] == '<http://www.w3.org/1999/02/22-rdf-syntax-ns#type>':\n",
    "        entities_for_type_G1[t[2]].add(t[0])\n",
    "entities_for_type_G2 = dict([(i,set()) for i in types_G2])\n",
    "for t in G2_type_triples:\n",
    "    if t[1] == '<http://www.w3.org/1999/02/22-rdf-syntax-ns#type>':\n",
    "        entities_for_type_G2[t[2]].add(t[0])   \n",
    "for b in types_TG2:\n",
    "    \n",
    "    for a1 in types_TG1:\n",
    "        for a2 in types_TG1:\n",
    "            if a1 != a2 and a1 != b and a2!=b:\n",
    "                M = 0\n",
    "                entities_a1_a2 = entities_for_type_G1[a1] & entities_for_type_G1[a2]\n",
    "                N = len(entities_a1_a2)\n",
    "                for entity in entities_for_type_G2[b]:\n",
    "                    if entity in entities_a1_a2:\n",
    "                        M += 1\n",
    "                if N == 0:\n",
    "                        continue\n",
    "                if M/N > 0.5:\n",
    "\n",
    "                    #print(a1, a2, b)\n",
    "                    #print(M/N)\n",
    "                    f.write('{}\\t{}\\t{}\\t{}\\n'.format(str(M/N), a1, a2, b))\n",
    "f.close()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [],
   "source": [
    "# R(x,y) -> A(x)\n",
    "f = open('pattern8.txt',\"w+\")\n",
    "for a in types_TG2:\n",
    "    for r in relations_TG1:\n",
    "        N = len(pairs_for_relation_G1[r])\n",
    "        print(N)\n",
    "        M = 0\n",
    "        for p in pairs_for_relation_G1[r]:\n",
    "            \n",
    "            if p[0] in entities_for_type_G2[a]:\n",
    "                M += 1\n",
    "                #print(a, r, p[0])\n",
    "        if M/N >= 0.1:\n",
    "            f.write('{}\\t{}\\n'.format(str(M/N), r,a))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [],
   "source": [
    "# R(x,y) -> A(y)\n",
    "f = open('pattern9.txt',\"w+\")\n",
    "for a in types_TG2:\n",
    "    for r in relations_TG1:\n",
    "        N = len(pairs_for_relation_G1[r])\n",
    "        #print(N)\n",
    "        M = 0\n",
    "        for p in pairs_for_relation_G1[r]:\n",
    "            \n",
    "            if p[1] in entities_for_type_G2[a]:\n",
    "                M += 1\n",
    "                #print(a, r, p[0])\n",
    "        if M/N >= 0.1:\n",
    "\n",
    "            print(r, a)\n",
    "            print(M/N)\n",
    "            f.write('{}\\t{}\\n'.format(str(M/N), r,a))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [],
   "source": [
    "# R(x,y) -> A(x)\n",
    "f = open('pattern10.txt',\"w+\")\n",
    "for a in types_TG2:\n",
    "    for r in relations_TG1:\n",
    "        N = len(pairs_for_relation_G1[r])\n",
    "        #print(N)\n",
    "        M = 0\n",
    "        for p in pairs_for_relation_G1[r]:\n",
    "            \n",
    "            if p[0] in entities_for_type_G2[a]:\n",
    "                M += 1\n",
    "                #print(a, r, p[0])\n",
    "        #if M != 0:\n",
    "            #print(M)\n",
    "        if M/N >= 0.05:\n",
    "\n",
    "            print(r, a)\n",
    "            print(M/N)\n",
    "            f.write('{}\\t{}\\n'.format(str(M/N), r,a))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.6.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
