{
 "cells": [
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-08-04T16:43:23.505438Z",
     "start_time": "2024-08-04T16:43:22.990159Z"
    }
   },
   "cell_type": "code",
   "source": [
    "import editdistance\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "\n",
    "from src.evaluation.longest_common_subsequence import get_longest_common_word_subsequence_length"
   ],
   "id": "103fa92a4a702497",
   "outputs": [],
   "execution_count": 1
  },
  {
   "metadata": {},
   "cell_type": "markdown",
   "source": "## Bongard AVR",
   "id": "8ca23f68d6404cf3"
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-07-27T14:45:59.815604Z",
     "start_time": "2024-07-27T14:45:59.803147Z"
    }
   },
   "cell_type": "code",
   "source": [
    "rules = pd.read_csv(\"../data/raw/labels.csv\")[[\"Left-side Rule\", \"Right-side Rule\"]].values\n",
    "rules"
   ],
   "id": "e29e37049fbeec6e",
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([['Empty picture', 'Not empty picture'],\n",
       "       ['Large figures', 'Small figures'],\n",
       "       ['Outline figures', 'Solid figures'],\n",
       "       ['Convex figures', 'Nonconvex figures'],\n",
       "       ['Polygons', 'Curvilinear figures'],\n",
       "       ['Triangles', 'Quadrangles'],\n",
       "       ['Figures elongated vertically', 'Figures elongated horizontally'],\n",
       "       ['Figures on the right side', 'Figures on the left side'],\n",
       "       ['Smooth contour figures', 'Twisting contour figures'],\n",
       "       ['Triangles', 'Quadrangles'],\n",
       "       ['Elongated figures', 'Compact figures'],\n",
       "       ['Convex hull of figure elongated',\n",
       "        'Convex hull of figure compact'],\n",
       "       ['Vertical rectangles or horizontal ellipses',\n",
       "        'Vertical ellipses or horizontal rectangles'],\n",
       "       ['Large total line length', 'Small total line length'],\n",
       "       ['Closed lines', 'Open lines'],\n",
       "       ['Spiral curls counterclockwise', 'Spiral curls clockwise'],\n",
       "       ['An acute angle directed inward', 'No angle directed inward'],\n",
       "       ['A neck', 'No neck'],\n",
       "       ['Neck horizontal', 'Neck vertical'],\n",
       "       ['Points located on one side of the neck',\n",
       "        'Points located on both sides of the neck'],\n",
       "       ['Small figure present', 'No small figure present'],\n",
       "       ['Areas of figures approximately equal',\n",
       "        'Areas of figures differ greatly'],\n",
       "       ['One figure', 'Two figures'],\n",
       "       ['A circle', 'No circle'],\n",
       "       ['Black figure is a triangle', 'Black figure is a circle'],\n",
       "       ['Solid black triangle', 'No solid black triangle'],\n",
       "       ['More solid black figures', 'More outline figures'],\n",
       "       ['More solid black circles', 'More outline circles'],\n",
       "       ['There are more small circles inside the figure outline than outside',\n",
       "        'There are fewer small circles inside the figure outline than outside'],\n",
       "       ['A line with a self-crossing', 'A line without a self-crossing'],\n",
       "       ['One line', 'Two lines'],\n",
       "       ['A sharp projection', 'No sharp projection'],\n",
       "       ['Acute angle', 'No acute angle'],\n",
       "       ['A large hole', 'A small hole'],\n",
       "       ['The axis of the hole is parallel to the figure axis',\n",
       "        'The axis of the hole is perpendicular to the figure axis'],\n",
       "       ['Triangle above circle', 'Circle above triangle'],\n",
       "       ['Triangle above circle', 'Circle above triangle'],\n",
       "       ['Triangle larger than circle', 'Triangle smaller than circle'],\n",
       "       ['Segments almost parallel to each other',\n",
       "        'Large angles between segments'],\n",
       "       ['Three points on a straight line',\n",
       "        'No three points on a straight line'],\n",
       "       ['Outline circles on one straight line',\n",
       "        'Outline circles not on one straight line'],\n",
       "       ['Points inside the figure outline are on a straight line',\n",
       "        'Points inside the figure outline are not on a straight line'],\n",
       "       ['The vibration amplitude increases from left to right',\n",
       "        'The vibration amplitude decreases from left to right'],\n",
       "       ['Small circles on different arcs', 'Small circles on one arc'],\n",
       "       ['Outline figure on top of solid black figure',\n",
       "        'Black figure on top of outline figure'],\n",
       "       ['Triangle on top of the circle', 'Circle on top of the triangle'],\n",
       "       ['Triangle inside of the circle', 'Circle inside of the triangle'],\n",
       "       ['Solid dark figures above the outline figures',\n",
       "        'Outline figures above the solid dark figures'],\n",
       "       ['Points inside the figure outline are grouped more densely than outside the contour',\n",
       "        'Points outside the figure contour are grouped more densely than inside the contour'],\n",
       "       ['Axes of symmetry', 'No axes of symmetry'],\n",
       "       ['Two circles close to each other',\n",
       "        'No two circles close to each other'],\n",
       "       ['Arrows pointing in different directions',\n",
       "        'Arrows pointing in the same direction'],\n",
       "       ['Inside figure has fewer angles than outside figure',\n",
       "        'Inside figure has more angles than outside figure'],\n",
       "       ['A cross, circle, and triangle arranged counterclockwise',\n",
       "        'A cross, circle, and triangle arranged clockwise'],\n",
       "       ['A circle is at the left of the cavity if you look from inside the figure',\n",
       "        'A circle is at the right of the cavity if you look from inside the figure'],\n",
       "       ['All figures of the same color', 'Figures of different colors'],\n",
       "       ['Identical figures', 'Figures not identical'],\n",
       "       ['Solid dark quadrangles are identical',\n",
       "        'Solid dark quadrangles are different'],\n",
       "       ['Figures are similar', 'Figures are not similar'],\n",
       "       ['Some similar figures', 'No similar figures'],\n",
       "       ['A line separates the crosses in half',\n",
       "        'A line does not separate the crosses in half'],\n",
       "       ['Ends of the curve are far apart',\n",
       "        'Ends of the curve are close together'],\n",
       "       ['Shading thicker on the right side',\n",
       "        'Shading thicker on the left side'],\n",
       "       ['A cross is located on the extension of the ellipse axis',\n",
       "        'A circle is located on the extension of the ellipse axis'],\n",
       "       ['A set of triangles elongated horizontally',\n",
       "        'A set of triangles elongated vertically'],\n",
       "       ['Unconnected circles on a horizontal line',\n",
       "        'Unconnected circles on a vertical line'],\n",
       "       ['The right branch begins at a higher point than the left branch',\n",
       "        'The right branch begins at a lower point than the left branch'],\n",
       "       ['The end of the right branch is higher than that of the left branch',\n",
       "        'The end of the right branch is lower than that of the left branch'],\n",
       "       ['Large black dot on the main branch',\n",
       "        'Large black dot on a side branch'],\n",
       "       ['There are no side branches of the second order',\n",
       "        'There are side branches of the second order'],\n",
       "       ['There are inside figures of the second order',\n",
       "        'There are no inside figures of the second order'],\n",
       "       ['Ends of the curve are parallel',\n",
       "        'Ends of the curve are perpendicular'],\n",
       "       ['The long axes of the ellipse and rectangle are perpendicular',\n",
       "        'The long axes of the ellipse and rectangle are parallel'],\n",
       "       ['A tail grows from the obtuse end',\n",
       "        'A tail grows from the acute end'],\n",
       "       ['Triangle located at the concave side of an arc',\n",
       "        'Triangle located at the convex side of an arc'],\n",
       "       ['Long sides concave', 'Long sides convex'],\n",
       "       ['Angle divided in half', 'Angle not divided in half'],\n",
       "       ['Extensions of segments cross at one point',\n",
       "        'Extensions of segments do not cross at one point'],\n",
       "       ['A dark circle is closer to the outline circle than to the triangle',\n",
       "        'A dark circle is closer to the triangle than to the outline circle'],\n",
       "       ['Points located at the same distances from a cross',\n",
       "        'Points located at different distances from a cross'],\n",
       "       ['Dark figures can be divided from outline figures by a straight line  alternatively:  Convex hulls of filled and outlined figures overlap',\n",
       "        'Dark figures are impossible to separate  alternatively:  Convex hulls of filled and outlined figures do not overlap'],\n",
       "       ['The convex hull of the crosses forms an equilateral triangle',\n",
       "        'The convex hull of the crosses does not form an equilateral triangle'],\n",
       "       ['A circle is inside of a figure made by crosses',\n",
       "        'A circle is outside of a figure made by crosses'],\n",
       "       ['A quadrangle is outside of a figure made by circles',\n",
       "        'A quadrangle is inside of a figure made by circles'],\n",
       "       ['Three parts', 'Five parts'],\n",
       "       ['Three parts', 'Five parts'],\n",
       "       ['Four parts', 'Five parts'],\n",
       "       ['Three parts', 'Five parts'],\n",
       "       ['Three parts', 'Five parts'],\n",
       "       ['Three parts', 'Four parts'],\n",
       "       ['Three identical elements', 'Four identical elements'],\n",
       "       ['The chain does not branch', 'The chain branches'],\n",
       "       ['Branches at outlined circle', 'Branches at solid dark circle'],\n",
       "       ['Solid dark circle not at end', 'Solid dark circle at end'],\n",
       "       ['Vertical hatched lines', 'Horizontal hatched lines'],\n",
       "       ['Triangles', 'Quadrangles'],\n",
       "       ['Triangles', 'Circles'],\n",
       "       ['Triangles', 'Quadrangles'],\n",
       "       ['Outlines made by triangles and circles intersect',\n",
       "        'Outlines made by triangles and circles do not intersect'],\n",
       "       ['The letter А', 'The letter Б'],\n",
       "       ['Parallel dents', 'Perpendicular dents'],\n",
       "       ['Internal arrows point outward', 'Internal arrows point inward'],\n",
       "       ['Isosceles triangle', 'Scalene triangle'],\n",
       "       ['One circle passes through the center of the other circle',\n",
       "        'No circle passes through the center of the other circle'],\n",
       "       ['Ends of line point to the same direction',\n",
       "        'Ends of line point to opposite directions'],\n",
       "       ['Negative slope', 'Positive slope'],\n",
       "       ['Three simple lines', 'Three complex lines'],\n",
       "       ['Petals taper off', 'Petals thicken'],\n",
       "       ['Circle on the right of the box',\n",
       "        'Circle on the left of the box'],\n",
       "       ['Four out of five objects are circles',\n",
       "        'Never four out of five objects are circles'],\n",
       "       ['Middle shape is a triangle', 'Middle shape is not a triangle'],\n",
       "       ['X-coordinates of dots are equidistant',\n",
       "        'Y-coordinates of dots are equidistant'],\n",
       "       ['T-like junction', 'Y-like junction'],\n",
       "       ['Four X-like points', 'Two X-like points'],\n",
       "       ['Innermost shape is reachable from the outermost one',\n",
       "        'Innermost shape is unreachable from the outermost one'],\n",
       "       ['Polygon stands on side', 'Polygon stands on vertex'],\n",
       "       ['Triangle points to center of circle',\n",
       "        'Triangle does not point to center of circle'],\n",
       "       ['No cycle', 'A cycle exists'],\n",
       "       ['A small correction will result into a single circle',\n",
       "        'No small correction will result into a single circle'],\n",
       "       ['All turns are in one direction  alternatively:  Rectangular loop exists',\n",
       "        'Turns are not all in one direction  alternatively:  No rectangular loop'],\n",
       "       ['Circle: VV; square: VΛ; triangle: ΛΛ; blank: ΛV',\n",
       "        'Circle: ΛΛ; square:  ΛV; triangle: VV; blank: VΛ'],\n",
       "       ['Line divides interior into two regions', 'Not so'],\n",
       "       ['Similar shapes', 'Dissimilar shapes'],\n",
       "       ['Similar textures', 'Dissimilar textures'],\n",
       "       ['One protrusion and one indentation of the same shape', 'Not so'],\n",
       "       ['One large and one small object', 'Not so'],\n",
       "       ['Exactly one circle', 'Not exactly one circle'],\n",
       "       ['Same objects inside and outside the large shape',\n",
       "        'Not same objects inside and outside the large shape'],\n",
       "       ['Indentation on protrusion', 'Indentation on indentation'],\n",
       "       ['Closed region is made of curves if “flaws” are ignored',\n",
       "        'Closed region is a polygon if “flaws” are ignored'],\n",
       "       ['Dots are vertices of a parallelogram',\n",
       "        'Dots are not vertices of a parallelogram'],\n",
       "       ['Dots are vertices of a triangle standing on a side',\n",
       "        'Dots are vertices of a triangle standing on a vertex'],\n",
       "       ['Dots collinear with center of circle',\n",
       "        'Dots not collinear with center of circle'],\n",
       "       ['Circle centers are collinear',\n",
       "        'Circle centers are not collinear'],\n",
       "       ['Circles on same side of curve',\n",
       "        'Circles on different sides of curves'],\n",
       "       ['Concave shape', 'Convex shape'],\n",
       "       ['Dots equal in number to the sides of the closed region',\n",
       "        'Dots unequal in number to the sides of the closed region'],\n",
       "       ['No dot well within the convex hull',\n",
       "        'At least one dot well within the convex hull'],\n",
       "       ['Similar components that change regularly', 'Not so'],\n",
       "       ['One large shape and two smaller identical ones', 'Not so'],\n",
       "       ['Two clusters of three and two objects each',\n",
       "        'One cluster of three objects and two different objects'],\n",
       "       ['Two clusters of three and two that are adjacent',\n",
       "        'Two clusters of three and two that are not adjacent'],\n",
       "       ['Two clusters of three and two', 'Two clusters of four and one'],\n",
       "       ['Two clusters of three and two but sharing a property  alternatively:  Different features yield different 3-2 splits',\n",
       "        'Two clusters of three and two, separable  alternatively:  Different features yield the same 3-2 split'],\n",
       "       ['Two clusters of four and one, the four are of same kind  alternatively:  Different features yield same 4-1 split',\n",
       "        'Two clusters of four and one, the four are three and one  alternatively:  Different features yield different 4-1 splits'],\n",
       "       ['A shape contains a square if and only if it is a circle',\n",
       "        'A shape contains a square if and only if it is a triangle'],\n",
       "       ['Two clusters of three and two, the two are vertical',\n",
       "        'Two clusters of three and two, the two are horizontal'],\n",
       "       ['A little less than a regular shape',\n",
       "        'A little more than a regular shape'],\n",
       "       ['Lone square', 'Lone circle'],\n",
       "       ['Odd number of squares', 'Even number of squares'],\n",
       "       ['If the circle closest to the cross is removed, the rest form an equilateral triangle',\n",
       "        'Not so'],\n",
       "       ['No vertical axis of symmetry', 'Vertical axis of symmetry'],\n",
       "       ['Predominance of curves and hook-like endings',\n",
       "        'Predominance of straight lines and staple-like endings'],\n",
       "       ['Wedged endings', 'Rounded endings'],\n",
       "       ['Curves are longer than straight lines',\n",
       "        'Curves are shorter than straight lines'],\n",
       "       ['Three spatially separated clusters',\n",
       "        'Two spatially separated clusters'],\n",
       "       ['White background', 'Black background'],\n",
       "       ['Some slope', 'Another slope'],\n",
       "       ['Two clusters of 2+3, middle shape must be seen as rectangle',\n",
       "        'Two clusters of 2+3, middle shape must be seen as piece of straight line'],\n",
       "       ['Quadrilateral that is nearly a triangle',\n",
       "        'Typical quadrilateral'],\n",
       "       ['Midpoints are collinear', 'Midpoints are not collinear'],\n",
       "       ['Every other side, if extended, passes through one point',\n",
       "        'Not so'],\n",
       "       ['Line connecting small shapes does not intersect large one',\n",
       "        'Line connecting small shapes intersects large one'],\n",
       "       ['Number of objects is one less than sides',\n",
       "        'Number of objects is one more than sides'],\n",
       "       ['Line perpendicular to one side of the object',\n",
       "        'Line parallel to one side of the object'],\n",
       "       ['Two clusters of dots', 'Three clusters of dots'],\n",
       "       ['Every cluster has two clusters of dots',\n",
       "        'Every cluster has three clusters of dots'],\n",
       "       ['Bulky interior, if closed', 'Narrow interior, if closed'],\n",
       "       ['Two clusters of different numbers of elements',\n",
       "        'Two clusters of equal number of elements'],\n",
       "       ['Π-like shape', 'X-like shape'],\n",
       "       ['Angle bisectors meet at the incenter',\n",
       "        'Perpendicular bisectors meet at the orthocenter'],\n",
       "       ['Radially symmetric', 'Not radially symmetric'],\n",
       "       ['Small variance of slopes', 'Large variance of slopes'],\n",
       "       ['Convex central interior', 'Concave central interior'],\n",
       "       ['Small object can glide in the bay',\n",
       "        'Small object cannot glide in the bay'],\n",
       "       ['Line that connects dots avoiding obstacles is short',\n",
       "        'Line that connects dots avoiding obstacles is long'],\n",
       "       ['All interiors are convex', 'At least one concave interior'],\n",
       "       ['Center of circle in triangle perpendicular to the other two',\n",
       "        'Not so'],\n",
       "       ['Object thinner at top', 'Object thicker at top'],\n",
       "       ['Black region narrows at the boundary or black/white',\n",
       "        'Black region widens at the boundary or black/white'],\n",
       "       ['One concavity', 'Two concavities'],\n",
       "       ['Concave if proximal points are connected',\n",
       "        'Convex if proximal points are connected'],\n",
       "       ['Same curvature close to the middle  alternative expression of the same idea:  Tangent near the middle leaves curve on the same side',\n",
       "        'Change of curvature close to the middle  alternative expression of the same idea:  Tangent near the middle leaves curve on opposite sides'],\n",
       "       ['Curve is smooth close to the middle',\n",
       "        'Curve zigzags close to the middle'],\n",
       "       ['Curve with two complex parts', 'Curve with three complex parts'],\n",
       "       ['Object made of objects',\n",
       "        'Object made of objects made of objects'],\n",
       "       ['Sides of parts are one more than sides of whole',\n",
       "        'Sides of parts are one less than sides of whole'],\n",
       "       ['Shape of whole different from shape of parts',\n",
       "        'Shape of whole same as shape of parts'],\n",
       "       ['All clusters are made of objects of the same texture',\n",
       "        'Not all clusters are made of objects of the same texture'],\n",
       "       ['All connected objects have the same texture',\n",
       "        'Some connected objects have different textures'],\n",
       "       ['Orifice on the left', 'Orifice on the right'],\n",
       "       ['Elongated vertically', 'Elongated horizontally'],\n",
       "       ['“Ghost” triangle', '“Ghost” rectangle'],\n",
       "       ['Background is a parallelogram', 'Background is a triangle'],\n",
       "       ['Bottom object in front of top objects in 3-D',\n",
       "        'Bottom object behind top objects in 3-D'],\n",
       "       ['Light-colored texture', 'Dark-colored texture'],\n",
       "       ['Some style (font)', 'Another style (font)'],\n",
       "       ['Stays in  alternative lower-level expression of the same idea:  One end of the chain is inside the large shape',\n",
       "        'Escapes  alternative lower-level expression of the same idea:  Both ends of the chain are outside the large shape'],\n",
       "       ['Stays put  alternative lower-level expression of the same idea:  Vertical from barycenter intersects the base of the object',\n",
       "        'Tumbles  alternative lower-level expression of the same idea:  Vertical from barycenter avoids the base of the object'],\n",
       "       ['Bongard Problem with solution based on features',\n",
       "        'Bongard Problem with solution based on numerosity'],\n",
       "       ['Two of the shapes make tiles along their border lines',\n",
       "        'Not so'],\n",
       "       ['Even number', 'Odd number'],\n",
       "       ['Prime number', 'Composite number'],\n",
       "       ['Five', 'Four'],\n",
       "       ['Two clusters of two elements each', 'Not so'],\n",
       "       ['Curve ends in a roughly up or down direction',\n",
       "        'Curve ends in a roughly left or right direction'],\n",
       "       ['Curve ends on the left part of the box',\n",
       "        'Curve ends on the right part of the box'],\n",
       "       ['All curves spiral counterclockwise, starting from maximum curvature',\n",
       "        'All curves spiral clockwise, starting from maximum curvature'],\n",
       "       ['No objects are centered at the center of the box',\n",
       "        'One object is centered at the center of the box'],\n",
       "       ['Part of at least one object is out of box',\n",
       "        'All objects are within the box'],\n",
       "       ['More black than white', 'More white than black'],\n",
       "       ['No dot is too far apart from another dot',\n",
       "        'At least one dot is far apart from all other dots'],\n",
       "       ['Curve intersects itself at the point of greatest curvature',\n",
       "        'Not so'],\n",
       "       ['“Smiley face”', 'Not a \"smiley face”'],\n",
       "       ['“Mouth” concave upwards', '“Mouth” convex upwards'],\n",
       "       ['“Ink tip” (non-homogeneous line)',\n",
       "        '“Marker tip” (homogeneous line)'],\n",
       "       ['Perfectly drawn lines', 'Imperfectly drawn lines'],\n",
       "       ['Something is missing in the sequence',\n",
       "        'Nothing is missing in the sequence'],\n",
       "       ['Parallel curves', 'Non-parallel curves'],\n",
       "       ['One cluster', 'Two clusters'],\n",
       "       ['No small square at the end of any curve  alternatively:  Curves with a 3-D feeling',\n",
       "        'Curve ends at a small square  alternatively:  Flat (2-D) curves'],\n",
       "       ['Border of black rectangle is incomplete',\n",
       "        'Border of black rectangle is complete'],\n",
       "       ['Large black region if completed is a circle',\n",
       "        'Large black region if completed is an ellipse'],\n",
       "       ['Diametrically opposite objects affect similarly the large black circular region',\n",
       "        'Not so'],\n",
       "       ['Low contrast  alternative lower-level expression of the same idea:  No fully black region',\n",
       "        'High contrast  alternative lower-level expression of the same idea:  At least one fully black region'],\n",
       "       ['What comes out of black circle has a clockwise direction',\n",
       "        'Not so'],\n",
       "       ['Dots touch each other if and only if no large region touches the edges of the box',\n",
       "        'Dots don’t touch each other if and only if no large region touches the edges of the box'],\n",
       "       ['After rotating so that the longest line is horizontal, there is a “left arm” raised and a “weight” down',\n",
       "        'After rotating so that the longest line is horizontal, there is a “left arm” down and a “weight” raised'],\n",
       "       ['When the objects are rotated and their dots are overlapped and eliminated, they form three-square-tall structures with columns of the same color',\n",
       "        'Not so'],\n",
       "       ['Explanation / justification of BP#229 by its creator:  Long (doubly sized) objects are purines (A & G).  Short objects are pyrimidines (C & T).  Black are those forming triple Hbond (G and C).  White are those forming double Hbond (A & T).  On the left we have “matching codes”, i.e., bases, doublets or triplets that, when rotated, can pair correctly (A with T, G with C), binding the two “strands”.  On the right we have objects that no matter how they are rotated they do not pair correctly (because of bumps, wrong color codes, etc).',\n",
       "        'Explanation / justification of BP#229 by its creator:  Long (doubly sized) objects are purines (A & G).  Short objects are pyrimidines (C & T).  Black are those forming triple Hbond (G and C).  White are those forming double Hbond (A & T).  On the left we have “matching codes”, i.e., bases, doublets or triplets that, when rotated, can pair correctly (A with T, G with C), binding the two “strands”.  On the right we have objects that no matter how they are rotated they do not pair correctly (because of bumps, wrong color codes, etc).'],\n",
       "       ['The sum of vertices, line ends, and dots is 7', 'Not so'],\n",
       "       ['Five concavities', 'Not five concavities'],\n",
       "       ['Box divided into six areas', 'Box divided into four areas'],\n",
       "       ['Lines plus triangles equal stars',\n",
       "        'Lines minus triangles equal stars'],\n",
       "       ['Circle falls by gravity on the right half of box if let loose',\n",
       "        'Circle falls by gravity on the left half of box if let loose'],\n",
       "       ['The “rope”, if extended, reaches the other ball',\n",
       "        'The “rope”, if extended, does not reach the other ball'],\n",
       "       ['Texture with stripy squiggle', 'Texture with blotchy squiggle'],\n",
       "       ['Upper central line appears shorter than lower central line',\n",
       "        'Upper central line appears longer than lower central line'],\n",
       "       ['C-like curves point to the same direction',\n",
       "        'C-like curves point to opposite directions'],\n",
       "       ['Straight line parallel to line joining the ends of curve  alternatively:  Sliding the straight line suitably can make a closed area',\n",
       "        'Straight line perpendicular to line joining the ends of curve  alternatively:  Not so'],\n",
       "       ['Straight line joining the curve ends does not cut the curve',\n",
       "        'Straight line joining the curve ends intersects the curve'],\n",
       "       ['Circumference shorter than length of everything else',\n",
       "        'Circumference longer than length of everything else'],\n",
       "       ['Convex hull is a square', 'Convex hull is not a square'],\n",
       "       ['Triangle closer to box corner than any of the circles',\n",
       "        'Not so'],\n",
       "       ['Scanning left-to-right, top-to-bottom, each filled box is separated from the next filled box by the same number of empty boxes',\n",
       "        'Not so'],\n",
       "       ['Can be completed to be made into a rectangle',\n",
       "        'Cannot be completed to be made into a rectangle'],\n",
       "       ['Equal numbers of straight lines and continuous curves',\n",
       "        'Unequal numbers of straight lines and continuous curves'],\n",
       "       ['Five straight or curved lines',\n",
       "        'Not five straight or curved lines'],\n",
       "       ['Dashed lines inside solid shape make an identical but slightly smaller shape, “parallel” to the one outside',\n",
       "        'Not so'],\n",
       "       ['Dashed lines form the same shape centered inside', 'Not so'],\n",
       "       ['Tetrahedron projected on the box plane  alternative lower-level expression of the same idea:  Four points interconnected with straight lines where one of the points might lie on an edge',\n",
       "        'Not so'],\n",
       "       ['Tetrahedron projected on the box plane', 'Not so'],\n",
       "       ['Impossible solid in 3-D', 'Possible solid in 3-D'],\n",
       "       ['Prime number  solution without using the arithmetic concept of primality:  It is impossible to create subgroups all of which have the same number of two-or-more identically shaped objects',\n",
       "        'Composite number  solution without using the arithmetic concept of primality:  It is possible to create subgroups all of which have the same number of two-or-more identically shaped objects'],\n",
       "       ['Circle and two vertices are collinear',\n",
       "        'No two vertices and the circle are collinear'],\n",
       "       ['Three pairs of parallel and non-collinear pieces of straight lines, each pair with a different slope',\n",
       "        'Not so'],\n",
       "       ['Each large circle closer to a small circle than a large one, and each small circle closer to a large one than a small one',\n",
       "        'Not so'],\n",
       "       ['The distance from the center of the line to the bottom of the square is the same as the distance from the dot to the right edge of the square',\n",
       "        'Not so'],\n",
       "       ['Objects identical after mirroring horizontally',\n",
       "        'Objects identical after mirroring vertically'],\n",
       "       ['Two identical overlapping objects of which the top is rotated slightly clockwise',\n",
       "        'Not so'],\n",
       "       ['Squares are either all empty or all contain something',\n",
       "        'Not so'],\n",
       "       ['Straight lines that join filled and outlined circles intersect',\n",
       "        'Straight lines that join filled and outlined circles do not intersect'],\n",
       "       ['Exactly one point where lines bend at an angle',\n",
       "        'Not exactly one point where lines bend at an angle'],\n",
       "       ['At least one ending edge is straight',\n",
       "        'All ending edges are curved'],\n",
       "       ['Closed area', 'No closed area'],\n",
       "       ['Axis of symmetry', 'No axis of symmetry'],\n",
       "       ['At least one touch or cross point', 'No touch or cross point'],\n",
       "       ['Odd number of straight line segments',\n",
       "        'Even number of straight line segments'],\n",
       "       ['Convex hull elongated vertically',\n",
       "        'Convex hull elongated horizontally'],\n",
       "       ['Center of symmetry', 'No center of symmetry'],\n",
       "       ['Only vertical or horizontal lines',\n",
       "        'Neither vertical nor horizontal lines'],\n",
       "       ['Can be hand-written without raising the pen',\n",
       "        'Cannot be hand-written without raising the pen'],\n",
       "       ['Convex hull is a triangle', 'Convex hull is a quadrilateral'],\n",
       "       ['Stays put', 'Tumbles'],\n",
       "       ['Notch from above (holds poured water)',\n",
       "        'No notch from above (does not hold poured water)'],\n",
       "       ['Straight line joining the ends does not intersect the object',\n",
       "        'Straight line joining the ends intersects the object'],\n",
       "       ['At least one endpoint', 'No endpoints'],\n",
       "       ['One object', 'Two or more objects'],\n",
       "       ['Shorter on the left, taller on the right',\n",
       "        'Taller on the left, shorter on the right'],\n",
       "       ['The left part has more pixels than the right part',\n",
       "        'The left part has fewer pixels than the right part'],\n",
       "       ['The left part is wider than the right part',\n",
       "        'The left part is narrower than the right part'],\n",
       "       ['Equal number of horizontal and vertical lines',\n",
       "        'Unequal number of horizontal and vertical lines'],\n",
       "       ['Shape of black region same as overall shape of object',\n",
       "        'Shape of black region different from overall shape of object'],\n",
       "       ['Rectangle left after tiling all black shapes into empty square',\n",
       "        'Triangle left after tiling all black shapes into empty square'],\n",
       "       ['Half of the square is filled',\n",
       "        'Either more or less than half of the square is filled'],\n",
       "       ['The centers (“barycenters”) of the objects are collinear',\n",
       "        'The centers (“barycenters”) of the objects are not collinear'],\n",
       "       ['Decreasing in size from top to bottom',\n",
       "        'Increasing in size from top to bottom'],\n",
       "       ['“Rays” emanating from a central point  alternative lower-level expression of the same idea:  Altitudes of isosceles triangles meet at a point if extended from top to base',\n",
       "        'Not so'],\n",
       "       ['The sum of the ratios of the filled areas is 1',\n",
       "        'The sum of the ratios of the filled areas is other than 1'],\n",
       "       ['Shapes, if tiled up properly, form a square',\n",
       "        'Shapes cannot form a square no matter how they are tiled'],\n",
       "       ['If any non-nosed faces exist, they are happy if and only if happy nosed faces exist as well',\n",
       "        'Not so'],\n",
       "       ['The shapes in the large square never appear outside of it',\n",
       "        'At least one shape in the large square appears outside of it'],\n",
       "       ['Angle made by shapes with vertex at square is not acute',\n",
       "        'Angle made by shapes with vertex at square is acute'],\n",
       "       ['Square divided into four areas of the same size and shape',\n",
       "        'Not so'],\n",
       "       ['The two points are reachable through a path',\n",
       "        'The two points are unreachable by any path'],\n",
       "       ['Line joins large and small square',\n",
       "        'Line joins the two middle-sized squares'],\n",
       "       ['All three sizes are present',\n",
       "        'Only two of the three sizes present'],\n",
       "       ['“Ghost shape” is square', '“Ghost shape” is rectangular'],\n",
       "       ['One of the two small squares is near the lower-right corner',\n",
       "        'One of the two small squares is near the upper-right corner'],\n",
       "       ['Lines if slightly extended make up a regular polygon',\n",
       "        'Lines if slightly extended cannot make up a regular polygon'],\n",
       "       ['Acceleration and deceleration', 'Constant speed'],\n",
       "       ['Large and medium-sized square, the latter can be hidden',\n",
       "        'Large and small-sized square, the latter can be hidden'],\n",
       "       ['Collinear objects, of which the 3rd is moved elsewhere',\n",
       "        'Collinear objects, of which the 2nd/4th is moved elsewhere'],\n",
       "       ['Three objects are identical, the fourth differs', 'Not so'],\n",
       "       ['At least one (interior or exterior) right angle',\n",
       "        'No right angle (either interior or exterior)'],\n",
       "       ['Shapes identical after rotation',\n",
       "        'Shapes identical after rotation and mirroring'],\n",
       "       ['Ratio of inside to outside identical shapes is constant',\n",
       "        'Not so'],\n",
       "       ['Barycenter of each cluster of dots near a vertex  alternative:  Three or more small clusters of dots',\n",
       "        'Not so'],\n",
       "       ['Three or more small clusters of dots', 'Not so'],\n",
       "       ['Ball touches curve at a point of local minimum downwards',\n",
       "        'Ball touches curve at a point of local maximum upwards'],\n",
       "       ['Enclosed square “repelled” by the outside squares, closest to the side of the enclosing square that’s farthest from the common center of the outside squares.',\n",
       "        'Enclosed square “attracted” by the outside squares, closest to the side of the enclosing square that’s closest to the common center of the outside squares.'],\n",
       "       ['Number of sides – number of pluses = 3',\n",
       "        'Number of sides – number of pluses = 4'],\n",
       "       ['Lines intersect within the box',\n",
       "        'Lines intersect out of the box'],\n",
       "       ['Closed curves clockwise, open curves counterclockwise',\n",
       "        'Closed curves counterclockwise, open curves clockwise'],\n",
       "       ['Long distance between the marked locations',\n",
       "        'Short distance between the marked locations'],\n",
       "       ['One area unreachable by the marked locations',\n",
       "        'All areas reachable by the marked locations'],\n",
       "       ['At least one path is a cycle', 'No path is a cycle'],\n",
       "       ['Number of enclosed dots proportional to the circle size',\n",
       "        'Not so'],\n",
       "       ['The numbers of dots are in sequence', 'Not so'],\n",
       "       ['The number of dots in one cluster is a multiple of the other',\n",
       "        'Not so'],\n",
       "       ['The numbers of dots in the two clusters are approximately equal',\n",
       "        'The numbers of dots in the two clusters differ a lot'],\n",
       "       ['Small round object unreachable from the border of the box',\n",
       "        'Small round object reachable from the border of the box'],\n",
       "       ['One outer outline', 'More than one outer outline'],\n",
       "       ['Jigsaw puzzle pieces can be assembled into a square',\n",
       "        'Jigsaw puzzle pieces cannot be assembled into a square'],\n",
       "       ['Left shapes can be placed on top of each other to make right shape',\n",
       "        'Not so'],\n",
       "       ['Left shapes can combine by symmetric difference (“xor” logical operator) to make right shape',\n",
       "        'Left shapes can combine by intersection (“and” logical operator) to make right shape'],\n",
       "       ['Straight line tangent to circle',\n",
       "        'Straight line not tangent to circle'],\n",
       "       ['Straight line tangent to curve',\n",
       "        'Straight line not tangent to curve'],\n",
       "       ['All sides are equal', 'All angles are equal'],\n",
       "       ['Regular polygon', 'Not regular polygon'],\n",
       "       ['1-D (line drawing, locally straight line)', '2-D'],\n",
       "       ['2-D (surface, locally flat)', '3-D'],\n",
       "       ['Transparent solid', 'Opaque solid'],\n",
       "       ['Platonic solid (regular polyhedron)', 'Not a platonic solid'],\n",
       "       ['Odd number of dots', 'Even number of dots'],\n",
       "       ['Tessellates the plane', 'Does not tessellate the plane'],\n",
       "       ['One gear turns all', 'No gear turns all'],\n",
       "       ['Black is below upward slopes', 'Black is below downward slopes'],\n",
       "       ['High approximate similarity', 'Low approximate similarity'],\n",
       "       ['Union of left sets is right set',\n",
       "        'Intersection of left sets is right set'],\n",
       "       ['Regular star polygons that can be traced vertex-to-vertex in a continuous fashion',\n",
       "        'Not so'],\n",
       "       ['Strictly increasing or strictly decreasing border line',\n",
       "        'Both increasing and decreasing border line'],\n",
       "       ['Exactly one axis of symmetry',\n",
       "        'Either zero or more than one axis of symmetry'],\n",
       "       ['No two shapes are the same', 'At least two shapes are the same'],\n",
       "       ['Shape can tile with itself so as to create a parallelogram',\n",
       "        'Shape cannot tile with itself so as to create a parallelogram'],\n",
       "       ['Intersection of circle and square',\n",
       "        'Union of circle and square'],\n",
       "       ['Object on the right fits in category on the left',\n",
       "        'Object on the right does not fit in category on the left'],\n",
       "       ['No pattern (variety of shapes)',\n",
       "        'All shapes have something in common'],\n",
       "       ['Shape on the right is the convex hull of shape on the left',\n",
       "        'Not so'],\n",
       "       ['One object does not belong to the category of the rest',\n",
       "        'All objects form one category'],\n",
       "       ['Some quantity keeps increasing from left to right', 'Not so'],\n",
       "       ['Discrete quantity', 'Continuous quantity'],\n",
       "       ['Quantity has no lower bound', 'Quantity has lower bound'],\n",
       "       ['Increasing quantity may loop back to starting value',\n",
       "        'Increasing quantity cannot loop back to starting value'],\n",
       "       ['Angular quantity', 'Infinitely increasing quantity'],\n",
       "       ['Fractal iteration based on 2-D (shapes)',\n",
       "        'Fractal iteration based on 1-D (lines)'],\n",
       "       ['Object at lower-right fits as n-th item in the top row of objects, where n is the number of dots at lower-left',\n",
       "        'Not so'],\n",
       "       ['Decelerating change in quantity, left-to-right',\n",
       "        'Accelerating change in quantity, left-to-right'],\n",
       "       ['The circles will collide if the arrows are their velocities',\n",
       "        'The circles will not collide if the arrows are their velocities'],\n",
       "       ['Random arrangement of dots',\n",
       "        'Non-random (patterned) arrangement of dots'],\n",
       "       ['Order is high (low entropy)', 'Order is low (high entropy)'],\n",
       "       ['Analogy makes sense', 'Analogy does not make sense'],\n",
       "       ['Choice that solves the analogy exists',\n",
       "        'Choice that solves the analogy does not exist'],\n",
       "       ['Counterclockwise along the curve following the arrow',\n",
       "        'Clockwise along the curve following the arrow'],\n",
       "       ['Two clearly separable groups', 'No clearly separable groups'],\n",
       "       ['Two independent quantities changing simultaneously',\n",
       "        'A single quantity is changing'],\n",
       "       ['White dot is at center of mass',\n",
       "        'White dot is not at center of mass'],\n",
       "       ['Center of mass within the black area of the shape',\n",
       "        'Center of mass out of the black area of the shape'],\n",
       "       ['There is a point that can “see” (in straight lines) all points',\n",
       "        'There is no point that can “see” (in straight lines) all points'],\n",
       "       ['Pairs of points (small white circles) on one curve can be glued together to make the other curve',\n",
       "        'Not so'],\n",
       "       ['Gluing sides with the same symbols makes a sphere',\n",
       "        'Gluing sides with the same symbols makes a torus'],\n",
       "       ['Net (folding along edges can make a 3D solid)', 'No net'],\n",
       "       ['Object belongs to the left-hand side category',\n",
       "        'Object belongs to the right-hand side category'],\n",
       "       ['Intersection (logical conjunction)',\n",
       "        'Union (logical disjunction)'],\n",
       "       ['Simple object', 'Complex object'],\n",
       "       ['Representationally uniform', 'Representationally non-uniform'],\n",
       "       ['A “chess” piece moving as shown may reach every square',\n",
       "        'Not so'],\n",
       "       ['The two objects have similar representations',\n",
       "        'The two objects have dissimilar representations'],\n",
       "       ['The two objects are conceptually related',\n",
       "        'The two objects are conceptually unrelated'],\n",
       "       ['Complete set', 'Incomplete set'],\n",
       "       ['The set indicated by the objects is finite',\n",
       "        'The set indicated by the objects is infinite'],\n",
       "       ['Adding the top two waves yields the bottom wave', 'Not so'],\n",
       "       ['No knot (“unknot”)', 'Knot'],\n",
       "       ['When the shape is removed from the dots, the dots give enough information to place the shape back where it was',\n",
       "        'Not so'],\n",
       "       ['Square number of dots', 'Not a square number of dots'],\n",
       "       ['Nets of cubes', 'No nets of cubes'],\n",
       "       ['Lower shape can be used as a tile to build the upper one',\n",
       "        'Not so'],\n",
       "       ['Dots can be shared equally between figures',\n",
       "        'Dots cannot be shared equally between figures'],\n",
       "       ['White dot can “see” (in straight lines) all black points',\n",
       "        'White dot cannot “see” (in straight lines) all black points'],\n",
       "       ['Loops are “entangled” (in 3-D)',\n",
       "        'Loops can be separated (in 3-D)'],\n",
       "       ['Each graph vertex is uniquely defined by its connections (the graph does not admit nontrivial automorphisms)',\n",
       "        'The graph admits nontrivial automorphisms'],\n",
       "       ['There exists en edge such that removing it yields two disconnected graphs (i.e., the minimum number of edges whose removal results in two disconnected graphs is 1)',\n",
       "        'The minimum number of edges whose removal results in two disconnected graphs is 2'],\n",
       "       ['Exponential increase', 'Linear increase'],\n",
       "       ['Correct', 'Incorrect'],\n",
       "       ['For each colored square only, there exists a path starting on it that covers each square of the figure exactly once',\n",
       "        'There is no path that starts on a colored square and covers each square of the figure exactly once']],\n",
       "      dtype=object)"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "execution_count": 2
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-07-27T14:46:01.593819Z",
     "start_time": "2024-07-27T14:46:01.587717Z"
    }
   },
   "cell_type": "code",
   "source": [
    "offset = 20\n",
    "correct = rules[0:100]\n",
    "incorrect = np.concatenate((rules[offset:100], rules[0:offset]), axis=0)\n",
    "correct.shape, incorrect.shape"
   ],
   "id": "4724921f8a0dcca7",
   "outputs": [
    {
     "data": {
      "text/plain": [
       "((100, 2), (100, 2))"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "execution_count": 3
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-07-27T14:46:03.821774Z",
     "start_time": "2024-07-27T14:46:03.814162Z"
    }
   },
   "cell_type": "code",
   "source": [
    "edit_distance_ratio_warning_threshold = 0.7\n",
    "for i, (correct_concepts, incorrect_concepts) in enumerate(zip(correct, incorrect)):\n",
    "    left_distance = editdistance.eval(correct_concepts[0], incorrect_concepts[0])\n",
    "    right_distance = editdistance.eval(correct_concepts[1], incorrect_concepts[1])\n",
    "    left_ratio = left_distance / max(len(correct_concepts[0]), len(incorrect_concepts[0]))\n",
    "    right_ratio = right_distance / max(len(correct_concepts[1]), len(incorrect_concepts[1]))\n",
    "    print(\n",
    "        i,\n",
    "        \"-\",\n",
    "        f\"Left ED: {left_distance:02d} ({int(left_ratio * 100)}%)\",\n",
    "        \"-\",\n",
    "        f\"Right ED: {right_distance:02d} ({int(right_ratio * 100)}%)\",\n",
    "    )\n",
    "    if left_ratio < edit_distance_ratio_warning_threshold:\n",
    "        print(\"    \", \"Left\", left_distance, \"    Correct:\",\n",
    "              correct_concepts[0], \"    Incorrect:\", incorrect_concepts[0])\n",
    "    if right_ratio < edit_distance_ratio_warning_threshold:\n",
    "        print(\"    \", \"Right\", right_distance, \"    Correct:\",\n",
    "              correct_concepts[1], \"    Incorrect:\", incorrect_concepts[1])"
   ],
   "id": "31e76b2cd708a71f",
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 - Left ED: 15 (75%) - Right ED: 16 (69%)\n",
      "     Right 16     Correct: Not empty picture     Incorrect: No small figure present\n",
      "1 - Left ED: 27 (75%) - Right ED: 22 (70%)\n",
      "2 - Left ED: 05 (33%) - Right ED: 05 (38%)\n",
      "     Left 5     Correct: Outline figures     Incorrect: One figure\n",
      "     Right 5     Correct: Solid figures     Incorrect: Two figures\n",
      "3 - Left ED: 11 (78%) - Right ED: 12 (70%)\n",
      "4 - Left ED: 24 (92%) - Right ED: 20 (83%)\n",
      "5 - Left ED: 14 (70%) - Right ED: 17 (73%)\n",
      "6 - Left ED: 23 (82%) - Right ED: 24 (80%)\n",
      "7 - Left ED: 21 (84%) - Right ED: 18 (75%)\n",
      "8 - Left ED: 54 (80%) - Right ED: 54 (79%)\n",
      "9 - Left ED: 23 (85%) - Right ED: 27 (90%)\n",
      "10 - Left ED: 12 (70%) - Right ED: 11 (73%)\n",
      "11 - Left ED: 26 (83%) - Right ED: 24 (82%)\n",
      "12 - Left ED: 35 (83%) - Right ED: 33 (78%)\n",
      "13 - Left ED: 17 (73%) - Right ED: 17 (73%)\n",
      "14 - Left ED: 44 (86%) - Right ED: 49 (87%)\n",
      "15 - Left ED: 21 (72%) - Right ED: 17 (77%)\n",
      "16 - Left ED: 20 (66%) - Right ED: 19 (79%)\n",
      "     Left 20     Correct: An acute angle directed inward     Incorrect: Triangle above circle\n",
      "17 - Left ED: 24 (88%) - Right ED: 25 (89%)\n",
      "18 - Left ED: 32 (84%) - Right ED: 26 (89%)\n",
      "19 - Left ED: 26 (68%) - Right ED: 29 (72%)\n",
      "     Left 26     Correct: Points located on one side of the neck     Incorrect: Three points on a straight line\n",
      "20 - Left ED: 28 (77%) - Right ED: 33 (82%)\n",
      "21 - Left ED: 41 (74%) - Right ED: 44 (74%)\n",
      "22 - Left ED: 46 (88%) - Right ED: 44 (84%)\n",
      "23 - Left ED: 24 (77%) - Right ED: 17 (70%)\n",
      "24 - Left ED: 28 (65%) - Right ED: 20 (54%)\n",
      "     Left 28     Correct: Black figure is a triangle     Incorrect: Outline figure on top of solid black figure\n",
      "     Right 20     Correct: Black figure is a circle     Incorrect: Black figure on top of outline figure\n",
      "25 - Left ED: 23 (79%) - Right ED: 18 (62%)\n",
      "     Right 18     Correct: No solid black triangle     Incorrect: Circle on top of the triangle\n",
      "26 - Left ED: 22 (75%) - Right ED: 22 (75%)\n",
      "27 - Left ED: 33 (75%) - Right ED: 33 (75%)\n",
      "28 - Left ED: 56 (68%) - Right ED: 61 (74%)\n",
      "     Left 56     Correct: There are more small circles inside the figure outline than outside     Incorrect: Points inside the figure outline are grouped more densely than outside the contour\n",
      "29 - Left ED: 22 (81%) - Right ED: 25 (83%)\n",
      "30 - Left ED: 27 (87%) - Right ED: 28 (82%)\n",
      "31 - Left ED: 29 (74%) - Right ED: 27 (72%)\n",
      "32 - Left ED: 42 (84%) - Right ED: 40 (81%)\n",
      "33 - Left ED: 44 (80%) - Right ED: 40 (83%)\n",
      "34 - Left ED: 49 (68%) - Right ED: 51 (69%)\n",
      "     Left 49     Correct: The axis of the hole is parallel to the figure axis     Incorrect: A circle is at the left of the cavity if you look from inside the figure\n",
      "     Right 51     Correct: The axis of the hole is perpendicular to the figure axis     Incorrect: A circle is at the right of the cavity if you look from inside the figure\n",
      "35 - Left ED: 22 (75%) - Right ED: 22 (81%)\n",
      "36 - Left ED: 17 (80%) - Right ED: 17 (80%)\n",
      "37 - Left ED: 27 (75%) - Right ED: 28 (77%)\n",
      "38 - Left ED: 30 (78%) - Right ED: 22 (75%)\n",
      "39 - Left ED: 25 (80%) - Right ED: 27 (79%)\n",
      "40 - Left ED: 26 (72%) - Right ED: 31 (70%)\n",
      "41 - Left ED: 36 (65%) - Right ED: 38 (64%)\n",
      "     Left 36     Correct: Points inside the figure outline are on a straight line     Incorrect: Ends of the curve are far apart\n",
      "     Right 38     Correct: Points inside the figure outline are not on a straight line     Incorrect: Ends of the curve are close together\n",
      "42 - Left ED: 39 (75%) - Right ED: 37 (71%)\n",
      "43 - Left ED: 41 (74%) - Right ED: 43 (76%)\n",
      "44 - Left ED: 38 (88%) - Right ED: 33 (84%)\n",
      "45 - Left ED: 30 (75%) - Right ED: 27 (71%)\n",
      "46 - Left ED: 43 (69%) - Right ED: 44 (72%)\n",
      "     Left 43     Correct: Triangle inside of the circle     Incorrect: The right branch begins at a higher point than the left branch\n",
      "47 - Left ED: 48 (72%) - Right ED: 49 (75%)\n",
      "48 - Left ED: 65 (79%) - Right ED: 64 (78%)\n",
      "49 - Left ED: 38 (82%) - Right ED: 33 (76%)\n",
      "50 - Left ED: 31 (70%) - Right ED: 34 (72%)\n",
      "51 - Left ED: 30 (76%) - Right ED: 28 (75%)\n",
      "52 - Left ED: 46 (76%) - Right ED: 43 (78%)\n",
      "53 - Left ED: 44 (80%) - Right ED: 37 (77%)\n",
      "54 - Left ED: 50 (69%) - Right ED: 51 (69%)\n",
      "     Left 50     Correct: A circle is at the left of the cavity if you look from inside the figure     Incorrect: Triangle located at the concave side of an arc\n",
      "     Right 51     Correct: A circle is at the right of the cavity if you look from inside the figure     Incorrect: Triangle located at the convex side of an arc\n",
      "55 - Left ED: 23 (79%) - Right ED: 21 (77%)\n",
      "56 - Left ED: 18 (85%) - Right ED: 14 (56%)\n",
      "     Right 14     Correct: Figures not identical     Incorrect: Angle not divided in half\n",
      "57 - Left ED: 35 (85%) - Right ED: 39 (81%)\n",
      "58 - Left ED: 54 (81%) - Right ED: 53 (80%)\n",
      "59 - Left ED: 38 (77%) - Right ED: 41 (82%)\n",
      "60 - Left ED: 111 (81%) - Right ED: 86 (74%)\n",
      "61 - Left ED: 42 (70%) - Right ED: 49 (72%)\n",
      "62 - Left ED: 37 (80%) - Right ED: 37 (78%)\n",
      "63 - Left ED: 43 (78%) - Right ED: 41 (73%)\n",
      "64 - Left ED: 35 (85%) - Right ED: 33 (84%)\n",
      "65 - Left ED: 34 (85%) - Right ED: 32 (84%)\n",
      "66 - Left ED: 57 (91%) - Right ED: 55 (90%)\n",
      "67 - Left ED: 58 (87%) - Right ED: 60 (92%)\n",
      "68 - Left ED: 28 (82%) - Right ED: 27 (84%)\n",
      "69 - Left ED: 37 (80%) - Right ED: 38 (88%)\n",
      "70 - Left ED: 30 (68%) - Right ED: 37 (78%)\n",
      "     Left 30     Correct: There are inside figures of the second order     Incorrect: Three identical elements\n",
      "71 - Left ED: 24 (80%) - Right ED: 26 (74%)\n",
      "72 - Left ED: 46 (76%) - Right ED: 39 (70%)\n",
      "73 - Left ED: 22 (68%) - Right ED: 20 (64%)\n",
      "     Left 22     Correct: A tail grows from the obtuse end     Incorrect: Solid dark circle not at end\n",
      "     Right 20     Correct: A tail grows from the acute end     Incorrect: Solid dark circle at end\n",
      "74 - Left ED: 36 (78%) - Right ED: 34 (75%)\n",
      "75 - Left ED: 16 (88%) - Right ED: 15 (88%)\n",
      "76 - Left ED: 19 (90%) - Right ED: 23 (92%)\n",
      "77 - Left ED: 36 (87%) - Right ED: 44 (91%)\n",
      "78 - Left ED: 48 (72%) - Right ED: 46 (69%)\n",
      "     Right 46     Correct: A dark circle is closer to the triangle than to the outline circle     Incorrect: Outlines made by triangles and circles do not intersect\n",
      "79 - Left ED: 41 (83%) - Right ED: 42 (84%)\n",
      "80 - Left ED: 127 (93%) - Right ED: 103 (89%)\n",
      "81 - Left ED: 54 (90%) - Right ED: 61 (89%)\n",
      "82 - Left ED: 34 (73%) - Right ED: 36 (76%)\n",
      "83 - Left ED: 41 (80%) - Right ED: 39 (78%)\n",
      "84 - Left ED: 10 (90%) - Right ED: 14 (73%)\n",
      "85 - Left ED: 08 (72%) - Right ED: 10 (90%)\n",
      "86 - Left ED: 21 (75%) - Right ED: 23 (76%)\n",
      "87 - Left ED: 19 (76%) - Right ED: 18 (75%)\n",
      "88 - Left ED: 18 (81%) - Right ED: 20 (83%)\n",
      "89 - Left ED: 08 (72%) - Right ED: 09 (81%)\n",
      "90 - Left ED: 21 (87%) - Right ED: 19 (82%)\n",
      "91 - Left ED: 26 (83%) - Right ED: 24 (82%)\n",
      "92 - Left ED: 31 (73%) - Right ED: 30 (71%)\n",
      "93 - Left ED: 23 (82%) - Right ED: 19 (79%)\n",
      "94 - Left ED: 13 (59%) - Right ED: 17 (70%)\n",
      "     Left 13     Correct: Vertical hatched lines     Incorrect: Closed lines\n",
      "95 - Left ED: 24 (82%) - Right ED: 18 (81%)\n",
      "96 - Left ED: 25 (83%) - Right ED: 20 (83%)\n",
      "97 - Left ED: 08 (88%) - Right ED: 10 (90%)\n",
      "98 - Left ED: 42 (87%) - Right ED: 49 (89%)\n",
      "99 - Left ED: 33 (86%) - Right ED: 34 (85%)\n"
     ]
    }
   ],
   "execution_count": 4
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-07-27T14:46:04.622738Z",
     "start_time": "2024-07-27T14:46:04.615121Z"
    }
   },
   "cell_type": "code",
   "source": [
    "lcs_warning_threshold = 2\n",
    "for i, (correct_concepts, incorrect_concepts) in enumerate(zip(correct, incorrect)):\n",
    "    left_lcs = get_longest_common_word_subsequence_length(correct_concepts[0], incorrect_concepts[0])\n",
    "    right_lcs = get_longest_common_word_subsequence_length(correct_concepts[1], incorrect_concepts[1])\n",
    "    left_ratio = left_lcs / min(len(correct_concepts[0]), len(incorrect_concepts[0]))\n",
    "    right_ratio = right_lcs / min(len(correct_concepts[1]), len(incorrect_concepts[1]))\n",
    "    print(\n",
    "        i,\n",
    "        \"-\",\n",
    "        f\"Left LCS: {left_lcs} ({int(left_ratio * 100)}%)\",\n",
    "        \"-\",\n",
    "        f\"Right LCS: {right_lcs} ({int(right_ratio * 100)}%)\",\n",
    "    )\n",
    "    if left_lcs >= lcs_warning_threshold:\n",
    "        print(\"    \", \"Left\", \"    Correct:\", correct_concepts[0], \"    Incorrect:\", incorrect_concepts[0])\n",
    "    if right_lcs >= lcs_warning_threshold:\n",
    "        print(\"    \", \"Right\", \"    Correct:\", correct_concepts[1], \"    Incorrect:\", incorrect_concepts[1])"
   ],
   "id": "2bcfe2102133f46",
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "1 - Left LCS: 1 (7%) - Right LCS: 1 (7%)\n",
      "2 - Left LCS: 0 (0%) - Right LCS: 1 (9%)\n",
      "3 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "4 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "5 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "6 - Left LCS: 1 (4%) - Right LCS: 1 (5%)\n",
      "7 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "8 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "9 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "10 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "11 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "12 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "13 - Left LCS: 1 (8%) - Right LCS: 1 (8%)\n",
      "14 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "15 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "16 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "17 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "18 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "19 - Left LCS: 2 (6%) - Right LCS: 2 (5%)\n",
      "     Left     Correct: Points located on one side of the neck     Incorrect: Three points on a straight line\n",
      "     Right     Correct: Points located on both sides of the neck     Incorrect: No three points on a straight line\n",
      "20 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "21 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "22 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "23 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "24 - Left LCS: 2 (7%) - Right LCS: 2 (8%)\n",
      "     Left     Correct: Black figure is a triangle     Incorrect: Outline figure on top of solid black figure\n",
      "     Right     Correct: Black figure is a circle     Incorrect: Black figure on top of outline figure\n",
      "25 - Left LCS: 1 (5%) - Right LCS: 1 (4%)\n",
      "26 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "27 - Left LCS: 1 (4%) - Right LCS: 1 (5%)\n",
      "28 - Left LCS: 6 (8%) - Right LCS: 4 (5%)\n",
      "     Left     Correct: There are more small circles inside the figure outline than outside     Incorrect: Points inside the figure outline are grouped more densely than outside the contour\n",
      "     Right     Correct: There are fewer small circles inside the figure outline than outside     Incorrect: Points outside the figure contour are grouped more densely than inside the contour\n",
      "29 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "30 - Left LCS: 0 (0%) - Right LCS: 1 (11%)\n",
      "31 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "32 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "33 - Left LCS: 1 (8%) - Right LCS: 1 (8%)\n",
      "34 - Left LCS: 5 (9%) - Right LCS: 5 (8%)\n",
      "     Left     Correct: The axis of the hole is parallel to the figure axis     Incorrect: A circle is at the left of the cavity if you look from inside the figure\n",
      "     Right     Correct: The axis of the hole is perpendicular to the figure axis     Incorrect: A circle is at the right of the cavity if you look from inside the figure\n",
      "35 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "36 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "37 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "38 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "39 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "40 - Left LCS: 1 (2%) - Right LCS: 1 (2%)\n",
      "41 - Left LCS: 2 (6%) - Right LCS: 2 (5%)\n",
      "     Left     Correct: Points inside the figure outline are on a straight line     Incorrect: Ends of the curve are far apart\n",
      "     Right     Correct: Points inside the figure outline are not on a straight line     Incorrect: Ends of the curve are close together\n",
      "42 - Left LCS: 1 (3%) - Right LCS: 1 (3%)\n",
      "43 - Left LCS: 1 (3%) - Right LCS: 1 (4%)\n",
      "44 - Left LCS: 1 (2%) - Right LCS: 1 (2%)\n",
      "45 - Left LCS: 1 (3%) - Right LCS: 1 (3%)\n",
      "46 - Left LCS: 1 (3%) - Right LCS: 1 (3%)\n",
      "47 - Left LCS: 2 (4%) - Right LCS: 2 (4%)\n",
      "     Left     Correct: Solid dark figures above the outline figures     Incorrect: The end of the right branch is higher than that of the left branch\n",
      "     Right     Correct: Outline figures above the solid dark figures     Incorrect: The end of the right branch is lower than that of the left branch\n",
      "48 - Left LCS: 1 (2%) - Right LCS: 0 (0%)\n",
      "49 - Left LCS: 1 (6%) - Right LCS: 1 (5%)\n",
      "50 - Left LCS: 0 (0%) - Right LCS: 1 (2%)\n",
      "51 - Left LCS: 0 (0%) - Right LCS: 1 (2%)\n",
      "52 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "53 - Left LCS: 1 (3%) - Right LCS: 1 (3%)\n",
      "54 - Left LCS: 3 (6%) - Right LCS: 3 (6%)\n",
      "     Left     Correct: A circle is at the left of the cavity if you look from inside the figure     Incorrect: Triangle located at the concave side of an arc\n",
      "     Right     Correct: A circle is at the right of the cavity if you look from inside the figure     Incorrect: Triangle located at the convex side of an arc\n",
      "55 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "56 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "57 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "58 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "59 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "60 - Left LCS: 2 (5%) - Right LCS: 2 (4%)\n",
      "     Left     Correct: A line separates the crosses in half     Incorrect: Dark figures can be divided from outline figures by a straight line  alternatively:  Convex hulls of filled and outlined figures overlap\n",
      "     Right     Correct: A line does not separate the crosses in half     Incorrect: Dark figures are impossible to separate  alternatively:  Convex hulls of filled and outlined figures do not overlap\n",
      "61 - Left LCS: 2 (6%) - Right LCS: 2 (5%)\n",
      "     Left     Correct: Ends of the curve are far apart     Incorrect: The convex hull of the crosses forms an equilateral triangle\n",
      "     Right     Correct: Ends of the curve are close together     Incorrect: The convex hull of the crosses does not form an equilateral triangle\n",
      "62 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "63 - Left LCS: 3 (5%) - Right LCS: 3 (6%)\n",
      "     Left     Correct: A cross is located on the extension of the ellipse axis     Incorrect: A quadrangle is outside of a figure made by circles\n",
      "     Right     Correct: A circle is located on the extension of the ellipse axis     Incorrect: A quadrangle is inside of a figure made by circles\n",
      "64 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "65 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "66 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "67 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "68 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "69 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "70 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "71 - Left LCS: 1 (4%) - Right LCS: 1 (5%)\n",
      "72 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "73 - Left LCS: 1 (3%) - Right LCS: 1 (4%)\n",
      "74 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "75 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "76 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "77 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "78 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "79 - Left LCS: 1 (8%) - Right LCS: 0 (0%)\n",
      "80 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "81 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "82 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "83 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "84 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "85 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "86 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "87 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "88 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "89 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "90 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "91 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "92 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "93 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "94 - Left LCS: 1 (8%) - Right LCS: 1 (10%)\n",
      "95 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "96 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "97 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "98 - Left LCS: 0 (0%) - Right LCS: 0 (0%)\n",
      "99 - Left LCS: 1 (8%) - Right LCS: 1 (8%)\n"
     ]
    }
   ],
   "execution_count": 5
  },
  {
   "metadata": {},
   "cell_type": "markdown",
   "source": "## Bongard OpenWorld",
   "id": "8d6e0e1e8fb4bcde"
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-08-01T16:51:06.481236Z",
     "start_time": "2024-08-01T16:51:06.437557Z"
    }
   },
   "cell_type": "code",
   "source": [
    "rules = pd.read_csv(\"../data/raw/bongard_open_world_labels.csv\")[[\"Left-side Rule\", \"Right-side Rule\"]].values\n",
    "rules"
   ],
   "id": "120c6bfc973e8e1",
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([['Fashion magazine.', 'NOT Fashion magazine.'],\n",
       "       ['Solar system.', 'NOT Solar system.'],\n",
       "       ['A bunch of branches on the green plant.',\n",
       "        'NOT A bunch of branches on the green plant.'],\n",
       "       ...,\n",
       "       ['A bouquet of flowers with oval petals.',\n",
       "        'NOT A bouquet of flowers with oval petals.'],\n",
       "       ['A civilian aircraft.', 'NOT A civilian aircraft.'],\n",
       "       ['Yellow mushrooms.', 'NOT Yellow mushrooms.']], dtype=object)"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "execution_count": 2
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-08-01T16:51:12.652259Z",
     "start_time": "2024-08-01T16:51:12.645967Z"
    }
   },
   "cell_type": "code",
   "source": [
    "offset = 20\n",
    "correct = rules[0:100]\n",
    "incorrect = np.concatenate((rules[offset:100], rules[0:offset]), axis=0)\n",
    "correct.shape, incorrect.shape"
   ],
   "id": "e430b76fb7876a5f",
   "outputs": [
    {
     "data": {
      "text/plain": [
       "((100, 2), (100, 2))"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "execution_count": 3
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-08-01T16:51:22.342552Z",
     "start_time": "2024-08-01T16:51:22.325508Z"
    }
   },
   "cell_type": "code",
   "source": [
    "edit_distance_ratio_warning_threshold = 0.7\n",
    "for i, (correct_concepts, incorrect_concepts) in enumerate(zip(correct, incorrect)):\n",
    "    left_distance = editdistance.eval(correct_concepts[0], incorrect_concepts[0])\n",
    "    right_distance = editdistance.eval(correct_concepts[1], incorrect_concepts[1])\n",
    "    left_ratio = left_distance / max(len(correct_concepts[0]), len(incorrect_concepts[0]))\n",
    "    right_ratio = right_distance / max(len(correct_concepts[1]), len(incorrect_concepts[1]))\n",
    "    print(\n",
    "        i,\n",
    "        \"-\",\n",
    "        f\"Left ED: {left_distance:02d} ({int(left_ratio * 100)}%)\",\n",
    "        \"-\",\n",
    "        f\"Right ED: {right_distance:02d} ({int(right_ratio * 100)}%)\",\n",
    "    )\n",
    "    if left_ratio < edit_distance_ratio_warning_threshold:\n",
    "        print(\"    \", \"Left\", left_distance, \"    Correct:\", correct_concepts[0], \"    Incorrect:\", incorrect_concepts[0])\n",
    "    if right_ratio < edit_distance_ratio_warning_threshold:\n",
    "        print(\"    \", \"Right\", right_distance, \"    Correct:\", correct_concepts[1], \"    Incorrect:\", incorrect_concepts[1])"
   ],
   "id": "a331be92ffa56d3f",
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 - Left ED: 20 (83%) - Right ED: 20 (71%)\n",
      "1 - Left ED: 27 (79%) - Right ED: 27 (71%)\n",
      "2 - Left ED: 32 (82%) - Right ED: 32 (74%)\n",
      "3 - Left ED: 29 (78%) - Right ED: 29 (70%)\n",
      "4 - Left ED: 24 (68%) - Right ED: 24 (61%)\n",
      "     Left 24     Correct: A pile of rusty metal bolts.     Incorrect: The top of a snow covered mountain.\n",
      "     Right 24     Correct: NOT A pile of rusty metal bolts.     Incorrect: NOT The top of a snow covered mountain.\n",
      "5 - Left ED: 21 (75%) - Right ED: 21 (65%)\n",
      "     Right 21     Correct: NOT A large wheat field.     Incorrect: NOT Steel beams of the building.\n",
      "6 - Left ED: 22 (64%) - Right ED: 22 (57%)\n",
      "     Left 22     Correct: Rubber kayak in the water.     Incorrect: People walking on the city street.\n",
      "     Right 22     Correct: NOT Rubber kayak in the water.     Incorrect: NOT People walking on the city street.\n",
      "7 - Left ED: 38 (80%) - Right ED: 38 (74%)\n",
      "8 - Left ED: 27 (75%) - Right ED: 27 (67%)\n",
      "     Right 27     Correct: NOT A perched mantis hanging on a plant.     Incorrect: NOT Keyboard of the piano.\n",
      "9 - Left ED: 30 (81%) - Right ED: 30 (73%)\n",
      "10 - Left ED: 24 (77%) - Right ED: 24 (68%)\n",
      "     Right 24     Correct: NOT Ellipsoidal fruits.     Incorrect: NOT Hand-held escalators on stairs.\n",
      "11 - Left ED: 21 (80%) - Right ED: 21 (70%)\n",
      "12 - Left ED: 30 (81%) - Right ED: 30 (73%)\n",
      "13 - Left ED: 34 (79%) - Right ED: 34 (72%)\n",
      "14 - Left ED: 22 (75%) - Right ED: 22 (66%)\n",
      "     Right 22     Correct: NOT A person playing a guitar.     Incorrect: NOT The tungsten lamp is glowing.\n",
      "15 - Left ED: 22 (78%) - Right ED: 22 (68%)\n",
      "     Right 22     Correct: NOT Bright red fish.     Incorrect: NOT The house in the heavy snow.\n",
      "16 - Left ED: 33 (75%) - Right ED: 33 (68%)\n",
      "     Right 33     Correct: NOT Reeds swaying in the wind.     Incorrect: NOT A small wooden boat floating on a calm lake.\n",
      "17 - Left ED: 36 (78%) - Right ED: 36 (72%)\n",
      "18 - Left ED: 31 (73%) - Right ED: 31 (67%)\n",
      "     Right 31     Correct: NOT Various colors of pigments.     Incorrect: NOT Human footprints in the sand on the beach.\n",
      "19 - Left ED: 62 (83%) - Right ED: 62 (79%)\n",
      "20 - Left ED: 20 (83%) - Right ED: 20 (71%)\n",
      "21 - Left ED: 27 (79%) - Right ED: 27 (71%)\n",
      "22 - Left ED: 25 (75%) - Right ED: 25 (67%)\n",
      "     Right 25     Correct: NOT Grilled steaks.     Incorrect: NOT Monsters in mythological stories.\n",
      "23 - Left ED: 26 (83%) - Right ED: 26 (74%)\n",
      "24 - Left ED: 27 (77%) - Right ED: 27 (69%)\n",
      "     Right 27     Correct: NOT The top of a snow covered mountain.     Incorrect: NOT Little kids steering cars.\n",
      "25 - Left ED: 22 (78%) - Right ED: 22 (68%)\n",
      "     Right 22     Correct: NOT Steel beams of the building.     Incorrect: NOT Dense binary numbers.\n",
      "26 - Left ED: 21 (61%) - Right ED: 21 (55%)\n",
      "     Left 21     Correct: People walking on the city street.     Incorrect: Traces left on the sand dunes.\n",
      "     Right 21     Correct: NOT People walking on the city street.     Incorrect: NOT Traces left on the sand dunes.\n",
      "27 - Left ED: 32 (68%) - Right ED: 32 (62%)\n",
      "     Left 32     Correct: A christmas ornament tree with colorful lights.     Incorrect: A closeup of a red brick wall.\n",
      "     Right 32     Correct: NOT A christmas ornament tree with colorful lights.     Incorrect: NOT A closeup of a red brick wall.\n",
      "28 - Left ED: 18 (81%) - Right ED: 18 (69%)\n",
      "     Right 18     Correct: NOT Keyboard of the piano.     Incorrect: NOT Black horse.\n",
      "29 - Left ED: 30 (81%) - Right ED: 30 (73%)\n",
      "30 - Left ED: 25 (80%) - Right ED: 25 (71%)\n",
      "31 - Left ED: 31 (81%) - Right ED: 31 (73%)\n",
      "32 - Left ED: 27 (72%) - Right ED: 27 (65%)\n",
      "     Right 27     Correct: NOT Tractors are working on a farm field.     Incorrect: NOT Persons riding bicycles.\n",
      "33 - Left ED: 26 (76%) - Right ED: 26 (68%)\n",
      "     Right 26     Correct: NOT A bicycle is placed in the corner.     Incorrect: NOT Men playing basketball.\n",
      "34 - Left ED: 20 (68%) - Right ED: 20 (60%)\n",
      "     Left 20     Correct: The tungsten lamp is glowing.     Incorrect: Wrestling competition.\n",
      "     Right 20     Correct: NOT The tungsten lamp is glowing.     Incorrect: NOT Wrestling competition.\n",
      "35 - Left ED: 27 (79%) - Right ED: 27 (71%)\n",
      "36 - Left ED: 34 (77%) - Right ED: 34 (70%)\n",
      "37 - Left ED: 34 (73%) - Right ED: 34 (68%)\n",
      "     Right 34     Correct: NOT The girl has long and thin braids on her head.     Incorrect: NOT An aerial view of the city.\n",
      "38 - Left ED: 33 (67%) - Right ED: 33 (62%)\n",
      "     Left 33     Correct: Human footprints in the sand on the beach.     Incorrect: Huge crystal chandelier hanging from the ceiling.\n",
      "     Right 33     Correct: NOT Human footprints in the sand on the beach.     Incorrect: NOT Huge crystal chandelier hanging from the ceiling.\n",
      "39 - Left ED: 28 (77%) - Right ED: 28 (70%)\n",
      "40 - Left ED: 31 (77%) - Right ED: 31 (70%)\n",
      "41 - Left ED: 26 (78%) - Right ED: 26 (70%)\n",
      "42 - Left ED: 27 (81%) - Right ED: 27 (72%)\n",
      "43 - Left ED: 24 (77%) - Right ED: 24 (68%)\n",
      "     Right 24     Correct: NOT Lettuce in the vegetable patch.     Incorrect: NOT White snowflakes.\n",
      "44 - Left ED: 20 (76%) - Right ED: 20 (66%)\n",
      "     Right 20     Correct: NOT Little kids steering cars.     Incorrect: NOT Fried noodles.\n",
      "45 - Left ED: 20 (71%) - Right ED: 20 (62%)\n",
      "     Right 20     Correct: NOT Dense binary numbers.     Incorrect: NOT A warning board in the wild.\n",
      "46 - Left ED: 23 (76%) - Right ED: 23 (67%)\n",
      "     Right 23     Correct: NOT Traces left on the sand dunes.     Incorrect: NOT A pile of bullet shells.\n",
      "47 - Left ED: 23 (76%) - Right ED: 23 (67%)\n",
      "     Right 23     Correct: NOT A closeup of a red brick wall.     Incorrect: NOT Colorful skulls.\n",
      "48 - Left ED: 45 (86%) - Right ED: 45 (80%)\n",
      "49 - Left ED: 25 (65%) - Right ED: 25 (59%)\n",
      "     Left 25     Correct: A soldier with a little girl.     Incorrect: A person doing yoga in the wilderness.\n",
      "     Right 25     Correct: NOT A soldier with a little girl.     Incorrect: NOT A person doing yoga in the wilderness.\n",
      "50 - Left ED: 23 (79%) - Right ED: 23 (69%)\n",
      "     Right 23     Correct: NOT Aircraft carrier.     Incorrect: NOT Gift boxes tied with ribbons.\n",
      "51 - Left ED: 33 (86%) - Right ED: 33 (78%)\n",
      "52 - Left ED: 34 (75%) - Right ED: 34 (69%)\n",
      "     Right 34     Correct: NOT Persons riding bicycles.     Incorrect: NOT A little girl dressed in a butterfly costume.\n",
      "53 - Left ED: 40 (78%) - Right ED: 40 (72%)\n",
      "54 - Left ED: 25 (78%) - Right ED: 25 (69%)\n",
      "     Right 25     Correct: NOT Wrestling competition.     Incorrect: NOT A delicious round birthday cake.\n",
      "55 - Left ED: 27 (79%) - Right ED: 27 (71%)\n",
      "56 - Left ED: 29 (74%) - Right ED: 29 (67%)\n",
      "     Right 29     Correct: NOT Police officers standing in the street.     Incorrect: NOT Various kinds of rings.\n",
      "57 - Left ED: 21 (77%) - Right ED: 21 (67%)\n",
      "     Right 21     Correct: NOT An aerial view of the city.     Incorrect: NOT Waterfront terrace.\n",
      "58 - Left ED: 39 (79%) - Right ED: 39 (73%)\n",
      "59 - Left ED: 29 (80%) - Right ED: 29 (72%)\n",
      "60 - Left ED: 29 (72%) - Right ED: 29 (65%)\n",
      "     Right 29     Correct: NOT A mesmerizing light show at the concert.     Incorrect: NOT A closeup view of cat.\n",
      "61 - Left ED: 26 (83%) - Right ED: 26 (74%)\n",
      "62 - Left ED: 20 (71%) - Right ED: 20 (62%)\n",
      "     Right 20     Correct: NOT A bunch of vibrant flowers.     Incorrect: NOT Live coral on the sea floor.\n",
      "63 - Left ED: 23 (82%) - Right ED: 23 (71%)\n",
      "64 - Left ED: 35 (83%) - Right ED: 35 (76%)\n",
      "65 - Left ED: 21 (70%) - Right ED: 21 (61%)\n",
      "     Right 21     Correct: NOT A warning board in the wild.     Incorrect: NOT A building with stone columns.\n",
      "66 - Left ED: 18 (75%) - Right ED: 18 (64%)\n",
      "     Right 18     Correct: NOT A pile of bullet shells.     Incorrect: NOT A transparent glass.\n",
      "67 - Left ED: 25 (83%) - Right ED: 25 (73%)\n",
      "68 - Left ED: 35 (67%) - Right ED: 35 (62%)\n",
      "     Left 35     Correct: A geometric painting in the style of abstractionist.     Incorrect: Boats sailing on a serene lake.\n",
      "     Right 35     Correct: NOT A geometric painting in the style of abstractionist.     Incorrect: NOT Boats sailing on a serene lake.\n",
      "69 - Left ED: 21 (55%) - Right ED: 21 (50%)\n",
      "     Left 21     Correct: A person doing yoga in the wilderness.     Incorrect: A person holding a camera.\n",
      "     Right 21     Correct: NOT A person doing yoga in the wilderness.     Incorrect: NOT A person holding a camera.\n",
      "70 - Left ED: 22 (75%) - Right ED: 22 (66%)\n",
      "     Right 22     Correct: NOT Gift boxes tied with ribbons.     Incorrect: NOT Knitted sweater.\n",
      "71 - Left ED: 12 (80%) - Right ED: 12 (63%)\n",
      "     Right 12     Correct: NOT Hockey stadium.     Incorrect: NOT Red bows.\n",
      "72 - Left ED: 34 (75%) - Right ED: 34 (69%)\n",
      "     Right 34     Correct: NOT A little girl dressed in a butterfly costume.     Incorrect: NOT A heart shaped symbol.\n",
      "73 - Left ED: 34 (66%) - Right ED: 34 (61%)\n",
      "     Left 34     Correct: A group of sheep grazing on a field of green grass.     Incorrect: A row of red wine bottles.\n",
      "     Right 34     Correct: NOT A group of sheep grazing on a field of green grass.     Incorrect: NOT A row of red wine bottles.\n",
      "74 - Left ED: 24 (75%) - Right ED: 24 (66%)\n",
      "     Right 24     Correct: NOT A delicious round birthday cake.     Incorrect: NOT Tennis racket or court.\n",
      "75 - Left ED: 17 (58%) - Right ED: 17 (51%)\n",
      "     Left 17     Correct: A girl leading a horse.     Incorrect: A man is training at the gym.\n",
      "     Right 17     Correct: NOT A girl leading a horse.     Incorrect: NOT A man is training at the gym.\n",
      "76 - Left ED: 22 (73%) - Right ED: 22 (64%)\n",
      "     Right 22     Correct: NOT Various kinds of rings.     Incorrect: NOT Keyboard of an old typewriter.\n",
      "77 - Left ED: 29 (74%) - Right ED: 29 (67%)\n",
      "     Right 29     Correct: NOT Waterfront terrace.     Incorrect: NOT Shiny metal coins scattered on a table.\n",
      "78 - Left ED: 30 (88%) - Right ED: 30 (78%)\n",
      "79 - Left ED: 18 (81%) - Right ED: 18 (69%)\n",
      "     Right 18     Correct: NOT Pictures of bananas.     Incorrect: NOT A threaded light bulb.\n",
      "80 - Left ED: 20 (90%) - Right ED: 20 (76%)\n",
      "81 - Left ED: 26 (83%) - Right ED: 26 (74%)\n",
      "82 - Left ED: 23 (58%) - Right ED: 23 (53%)\n",
      "     Left 23     Correct: Live coral on the sea floor.     Incorrect: A bunch of branches on the green plant.\n",
      "     Right 23     Correct: NOT Live coral on the sea floor.     Incorrect: NOT A bunch of branches on the green plant.\n",
      "83 - Left ED: 26 (70%) - Right ED: 26 (63%)\n",
      "     Right 26     Correct: NOT A handbag hanging somewhere.     Incorrect: NOT A group photo at a wedding reception.\n",
      "84 - Left ED: 31 (73%) - Right ED: 31 (67%)\n",
      "     Right 31     Correct: NOT A wooden fence surrounding a grassy field.     Incorrect: NOT A pile of rusty metal bolts.\n",
      "85 - Left ED: 21 (70%) - Right ED: 21 (61%)\n",
      "     Right 21     Correct: NOT A building with stone columns.     Incorrect: NOT A large wheat field.\n",
      "86 - Left ED: 20 (76%) - Right ED: 20 (66%)\n",
      "     Right 20     Correct: NOT A transparent glass.     Incorrect: NOT Rubber kayak in the water.\n",
      "87 - Left ED: 24 (80%) - Right ED: 24 (70%)\n",
      "88 - Left ED: 25 (69%) - Right ED: 25 (62%)\n",
      "     Left 25     Correct: Boats sailing on a serene lake.     Incorrect: A perched mantis hanging on a plant.\n",
      "     Right 25     Correct: NOT Boats sailing on a serene lake.     Incorrect: NOT A perched mantis hanging on a plant.\n",
      "89 - Left ED: 26 (70%) - Right ED: 26 (63%)\n",
      "     Right 26     Correct: NOT A person holding a camera.     Incorrect: NOT A group photo of the extended family.\n",
      "90 - Left ED: 15 (78%) - Right ED: 15 (65%)\n",
      "     Right 15     Correct: NOT Knitted sweater.     Incorrect: NOT Ellipsoidal fruits.\n",
      "91 - Left ED: 17 (80%) - Right ED: 17 (68%)\n",
      "     Right 17     Correct: NOT Red bows.     Incorrect: NOT An old style bicycle.\n",
      "92 - Left ED: 18 (81%) - Right ED: 18 (69%)\n",
      "     Right 18     Correct: NOT A heart shaped symbol.     Incorrect: NOT Stamp pictures.\n",
      "93 - Left ED: 31 (72%) - Right ED: 31 (65%)\n",
      "     Right 31     Correct: NOT A row of red wine bottles.     Incorrect: NOT Branches covered with heavily falling snow.\n",
      "94 - Left ED: 20 (76%) - Right ED: 20 (66%)\n",
      "     Right 20     Correct: NOT Tennis racket or court.     Incorrect: NOT A person playing a guitar.\n",
      "95 - Left ED: 23 (79%) - Right ED: 23 (69%)\n",
      "     Right 23     Correct: NOT A man is training at the gym.     Incorrect: NOT Bright red fish.\n",
      "96 - Left ED: 23 (76%) - Right ED: 23 (67%)\n",
      "     Right 23     Correct: NOT Keyboard of an old typewriter.     Incorrect: NOT Reeds swaying in the wind.\n",
      "97 - Left ED: 33 (78%) - Right ED: 33 (71%)\n",
      "98 - Left ED: 26 (76%) - Right ED: 26 (68%)\n",
      "     Right 26     Correct: NOT A woman in a red dress is dancing.     Incorrect: NOT Various colors of pigments.\n",
      "99 - Left ED: 61 (82%) - Right ED: 61 (78%)\n"
     ]
    }
   ],
   "execution_count": 4
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-08-01T16:53:33.489090Z",
     "start_time": "2024-08-01T16:53:33.475953Z"
    }
   },
   "cell_type": "code",
   "source": [
    "lcs_warning_threshold = 2\n",
    "for i, (correct_concepts, incorrect_concepts) in enumerate(zip(correct, incorrect)):\n",
    "    left_lcs = get_longest_common_word_subsequence_length(correct_concepts[0], incorrect_concepts[0])\n",
    "    right_lcs = get_longest_common_word_subsequence_length(correct_concepts[1], incorrect_concepts[1])\n",
    "    left_ratio = left_lcs / min(len(correct_concepts[0]), len(incorrect_concepts[0]))\n",
    "    right_ratio = right_lcs / min(len(correct_concepts[1]), len(incorrect_concepts[1]))\n",
    "    print(\n",
    "        i,\n",
    "        \"-\",\n",
    "        f\"Left LCS: {left_lcs} ({int(left_ratio * 100)}%)\",\n",
    "        \"-\",\n",
    "        f\"Right LCS: {right_lcs} ({int(right_ratio * 100)}%)\",\n",
    "    )\n",
    "    if left_lcs >= lcs_warning_threshold:\n",
    "        print(\"    \", \"Left\", \"    Correct:\", correct_concepts[0], \"    Incorrect:\", incorrect_concepts[0])\n",
    "    if right_lcs >= lcs_warning_threshold:\n",
    "        print(\"    \", \"Right\", \"    Correct:\", correct_concepts[1], \"    Incorrect:\", incorrect_concepts[1])"
   ],
   "id": "63909c20db8a3c35",
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "1 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "2 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "3 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "4 - Left LCS: 2 (7%) - Right LCS: 3 (9%)\n",
      "     Left     Correct: A pile of rusty metal bolts.     Incorrect: The top of a snow covered mountain.\n",
      "     Right     Correct: NOT A pile of rusty metal bolts.     Incorrect: NOT The top of a snow covered mountain.\n",
      "5 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "6 - Left LCS: 1 (3%) - Right LCS: 2 (6%)\n",
      "     Right     Correct: NOT Rubber kayak in the water.     Incorrect: NOT People walking on the city street.\n",
      "7 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "8 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "9 - Left LCS: 0 (0%) - Right LCS: 1 (2%)\n",
      "10 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "11 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "12 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "13 - Left LCS: 0 (0%) - Right LCS: 1 (2%)\n",
      "14 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "15 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "16 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "17 - Left LCS: 0 (0%) - Right LCS: 1 (2%)\n",
      "18 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "19 - Left LCS: 1 (6%) - Right LCS: 2 (10%)\n",
      "     Right     Correct: NOT Candle chandeliers hanging above a dining room table surrounded by chairs.     Incorrect: NOT A handicap sign.\n",
      "20 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "21 - Left LCS: 1 (3%) - Right LCS: 2 (5%)\n",
      "     Right     Correct: NOT Cars on the city streets at night.     Incorrect: NOT Fishing boats docked at the pier.\n",
      "22 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "23 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "24 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "25 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "26 - Left LCS: 2 (6%) - Right LCS: 3 (8%)\n",
      "     Left     Correct: People walking on the city street.     Incorrect: Traces left on the sand dunes.\n",
      "     Right     Correct: NOT People walking on the city street.     Incorrect: NOT Traces left on the sand dunes.\n",
      "27 - Left LCS: 1 (3%) - Right LCS: 2 (5%)\n",
      "     Right     Correct: NOT A christmas ornament tree with colorful lights.     Incorrect: NOT A closeup of a red brick wall.\n",
      "28 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "29 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "30 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "31 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "32 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "33 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "34 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "35 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "36 - Left LCS: 0 (0%) - Right LCS: 1 (2%)\n",
      "37 - Left LCS: 1 (3%) - Right LCS: 2 (6%)\n",
      "     Right     Correct: NOT The girl has long and thin braids on her head.     Incorrect: NOT An aerial view of the city.\n",
      "38 - Left LCS: 1 (2%) - Right LCS: 2 (4%)\n",
      "     Right     Correct: NOT Human footprints in the sand on the beach.     Incorrect: NOT Huge crystal chandelier hanging from the ceiling.\n",
      "39 - Left LCS: 1 (6%) - Right LCS: 2 (10%)\n",
      "     Right     Correct: NOT A handicap sign.     Incorrect: NOT A little girl in a princess costume.\n",
      "40 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "41 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "42 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "43 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "44 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "45 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "46 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "47 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "48 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "49 - Left LCS: 1 (3%) - Right LCS: 2 (6%)\n",
      "     Right     Correct: NOT A soldier with a little girl.     Incorrect: NOT A person doing yoga in the wilderness.\n",
      "50 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "51 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "52 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "53 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "54 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "55 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "56 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "57 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "58 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "59 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "60 - Left LCS: 1 (4%) - Right LCS: 2 (7%)\n",
      "     Right     Correct: NOT A mesmerizing light show at the concert.     Incorrect: NOT A closeup view of cat.\n",
      "61 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "62 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "63 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "64 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "65 - Left LCS: 1 (3%) - Right LCS: 2 (6%)\n",
      "     Right     Correct: NOT A warning board in the wild.     Incorrect: NOT A building with stone columns.\n",
      "66 - Left LCS: 1 (5%) - Right LCS: 2 (8%)\n",
      "     Right     Correct: NOT A pile of bullet shells.     Incorrect: NOT A transparent glass.\n",
      "67 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "68 - Left LCS: 1 (3%) - Right LCS: 2 (5%)\n",
      "     Right     Correct: NOT A geometric painting in the style of abstractionist.     Incorrect: NOT Boats sailing on a serene lake.\n",
      "69 - Left LCS: 2 (7%) - Right LCS: 3 (10%)\n",
      "     Left     Correct: A person doing yoga in the wilderness.     Incorrect: A person holding a camera.\n",
      "     Right     Correct: NOT A person doing yoga in the wilderness.     Incorrect: NOT A person holding a camera.\n",
      "70 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "71 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "72 - Left LCS: 1 (4%) - Right LCS: 2 (7%)\n",
      "     Right     Correct: NOT A little girl dressed in a butterfly costume.     Incorrect: NOT A heart shaped symbol.\n",
      "73 - Left LCS: 2 (7%) - Right LCS: 3 (10%)\n",
      "     Left     Correct: A group of sheep grazing on a field of green grass.     Incorrect: A row of red wine bottles.\n",
      "     Right     Correct: NOT A group of sheep grazing on a field of green grass.     Incorrect: NOT A row of red wine bottles.\n",
      "74 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "75 - Left LCS: 1 (4%) - Right LCS: 2 (7%)\n",
      "     Right     Correct: NOT A girl leading a horse.     Incorrect: NOT A man is training at the gym.\n",
      "76 - Left LCS: 1 (4%) - Right LCS: 2 (7%)\n",
      "     Right     Correct: NOT Various kinds of rings.     Incorrect: NOT Keyboard of an old typewriter.\n",
      "77 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "78 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "79 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "80 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "81 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "82 - Left LCS: 2 (7%) - Right LCS: 3 (9%)\n",
      "     Left     Correct: Live coral on the sea floor.     Incorrect: A bunch of branches on the green plant.\n",
      "     Right     Correct: NOT Live coral on the sea floor.     Incorrect: NOT A bunch of branches on the green plant.\n",
      "83 - Left LCS: 1 (3%) - Right LCS: 2 (6%)\n",
      "     Right     Correct: NOT A handbag hanging somewhere.     Incorrect: NOT A group photo at a wedding reception.\n",
      "84 - Left LCS: 1 (3%) - Right LCS: 2 (6%)\n",
      "     Right     Correct: NOT A wooden fence surrounding a grassy field.     Incorrect: NOT A pile of rusty metal bolts.\n",
      "85 - Left LCS: 1 (5%) - Right LCS: 2 (8%)\n",
      "     Right     Correct: NOT A building with stone columns.     Incorrect: NOT A large wheat field.\n",
      "86 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "87 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "88 - Left LCS: 2 (6%) - Right LCS: 3 (8%)\n",
      "     Left     Correct: Boats sailing on a serene lake.     Incorrect: A perched mantis hanging on a plant.\n",
      "     Right     Correct: NOT Boats sailing on a serene lake.     Incorrect: NOT A perched mantis hanging on a plant.\n",
      "89 - Left LCS: 1 (3%) - Right LCS: 2 (6%)\n",
      "     Right     Correct: NOT A person holding a camera.     Incorrect: NOT A group photo of the extended family.\n",
      "90 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "91 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "92 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "93 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "94 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "95 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "96 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "97 - Left LCS: 0 (0%) - Right LCS: 1 (2%)\n",
      "98 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "99 - Left LCS: 1 (4%) - Right LCS: 2 (7%)\n",
      "     Right     Correct: NOT A threaded light bulb.     Incorrect: NOT Candle chandeliers hanging above a dining room table surrounded by chairs.\n"
     ]
    }
   ],
   "execution_count": 5
  },
  {
   "metadata": {},
   "cell_type": "markdown",
   "source": "## Bongard HOI",
   "id": "673e32c8b5394a4b"
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-08-04T16:43:28.681202Z",
     "start_time": "2024-08-04T16:43:28.664105Z"
    }
   },
   "cell_type": "code",
   "source": [
    "rules = pd.read_csv(\"../data/raw/bongard_hoi_mix_labels.csv\")[[\"Left-side Rule\", \"Right-side Rule\"]].values\n",
    "rules"
   ],
   "id": "6fa2f3bc0c25a38c",
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([['swing tennis_racket', 'NOT swing tennis_racket'],\n",
       "       ['throw frisbee', 'NOT throw frisbee'],\n",
       "       ['brush_with toothbrush', 'NOT brush_with toothbrush'],\n",
       "       ['point_at_camera remote', 'NOT point_at_camera remote'],\n",
       "       ['use mouse', 'NOT use mouse'],\n",
       "       ['shear sheep', 'NOT shear sheep'],\n",
       "       ['wear tie', 'NOT wear tie'],\n",
       "       ['adjust_or_tie tie', 'NOT adjust_or_tie tie'],\n",
       "       ['help_adjust_or_tie tie', 'NOT help_adjust_or_tie tie'],\n",
       "       ['smell apple', 'NOT smell apple'],\n",
       "       ['hold_and_about_to_eat apple', 'NOT hold_and_about_to_eat apple'],\n",
       "       ['pick apple', 'NOT pick apple'],\n",
       "       ['peel_or_cut apple', 'NOT peel_or_cut apple'],\n",
       "       ['sit_on_with_multiple_person bench',\n",
       "        'NOT sit_on_with_multiple_person bench'],\n",
       "       ['stand_on chair', 'NOT stand_on chair'],\n",
       "       ['lie_on_like chair', 'NOT lie_on_like chair'],\n",
       "       ['eat orange', 'NOT eat orange'],\n",
       "       ['squeeze orange', 'NOT squeeze orange'],\n",
       "       ['peel orange', 'NOT peel orange'],\n",
       "       ['hold orange', 'NOT hold orange'],\n",
       "       ['sit_on toilet', 'NOT sit_on toilet'],\n",
       "       ['clean toilet', 'NOT clean toilet'],\n",
       "       ['hold carrot', 'NOT hold carrot'],\n",
       "       ['hold wine_glass', 'NOT hold wine_glass'],\n",
       "       ['sip wine_glass', 'NOT sip wine_glass'],\n",
       "       ['drive car', 'NOT drive car'],\n",
       "       ['wash car', 'NOT wash car'],\n",
       "       ['pet cat', 'NOT pet cat'],\n",
       "       ['hug cat', 'NOT hug cat'],\n",
       "       ['drive train', 'NOT drive train'],\n",
       "       ['ride boat', 'NOT ride boat'],\n",
       "       ['sail boat', 'NOT sail boat'],\n",
       "       ['drive boat', 'NOT drive boat'],\n",
       "       ['sit_on airplane', 'NOT sit_on airplane'],\n",
       "       ['control tv', 'NOT control tv'],\n",
       "       ['watch tv', 'NOT watch tv'],\n",
       "       ['hold person', 'NOT hold person'],\n",
       "       ['kiss person', 'NOT kiss person'],\n",
       "       ['hug person', 'NOT hug person'],\n",
       "       ['cut_with knife', 'NOT cut_with knife'],\n",
       "       ['clean refrigerator', 'NOT clean refrigerator'],\n",
       "       ['open refrigerator', 'NOT open refrigerator'],\n",
       "       ['fly kite', 'NOT fly kite'],\n",
       "       ['hold kite', 'NOT hold kite'],\n",
       "       ['type_on laptop', 'NOT type_on laptop'],\n",
       "       ['hold laptop', 'NOT hold laptop'],\n",
       "       ['repair laptop', 'NOT repair laptop'],\n",
       "       ['walk cow', 'NOT walk cow'],\n",
       "       ['cut cake', 'NOT cut cake'],\n",
       "       ['hold cake', 'NOT hold cake'],\n",
       "       ['blow cake', 'NOT blow cake'],\n",
       "       ['hold donut', 'NOT hold donut'],\n",
       "       ['hold tennis_racket', 'NOT hold tennis_racket'],\n",
       "       ['catch frisbee', 'NOT catch frisbee'],\n",
       "       ['hold frisbee', 'NOT hold frisbee'],\n",
       "       ['hold toothbrush', 'NOT hold toothbrush'],\n",
       "       ['hold remote', 'NOT hold remote'],\n",
       "       ['hold fork', 'NOT hold fork'],\n",
       "       ['hold mouse', 'NOT hold mouse'],\n",
       "       ['sit_on couch', 'NOT sit_on couch'],\n",
       "       ['lie_on couch', 'NOT lie_on couch'],\n",
       "       ['feed sheep', 'NOT feed sheep'],\n",
       "       ['pet sheep', 'NOT pet sheep'],\n",
       "       ['hold sheep', 'NOT hold sheep'],\n",
       "       ['carry handbag', 'NOT carry handbag'],\n",
       "       ['hold handbag', 'NOT hold handbag'],\n",
       "       ['ride surfboard', 'NOT ride surfboard'],\n",
       "       ['lie_on surfboard', 'NOT lie_on surfboard'],\n",
       "       ['carry surfboard', 'NOT carry surfboard'],\n",
       "       ['inspect surfboard', 'NOT inspect surfboard'],\n",
       "       ['jump surfboard', 'NOT jump surfboard'],\n",
       "       ['hold scissors', 'NOT hold scissors'],\n",
       "       ['cut_with scissors', 'NOT cut_with scissors'],\n",
       "       ['eat apple', 'NOT eat apple'],\n",
       "       ['hold apple', 'NOT hold apple'],\n",
       "       ['wash apple', 'NOT wash apple'],\n",
       "       ['sit_on bench', 'NOT sit_on bench'],\n",
       "       ['lie_on bench', 'NOT lie_on bench'],\n",
       "       ['sit_on chair', 'NOT sit_on chair'],\n",
       "       ['toast wine_glass', 'NOT toast wine_glass'],\n",
       "       ['board train', 'NOT board train'],\n",
       "       ['stand_on boat', 'NOT stand_on boat'],\n",
       "       ['row boat', 'NOT row boat'],\n",
       "       ['direct airplane', 'NOT direct airplane'],\n",
       "       ['greet person', 'NOT greet person'],\n",
       "       ['lick knife', 'NOT lick knife'],\n",
       "       ['wield knife', 'NOT wield knife'],\n",
       "       ['stick knife', 'NOT stick knife'],\n",
       "       ['read laptop', 'NOT read laptop'],\n",
       "       ['milk cow', 'NOT milk cow'],\n",
       "       ['grind snowboard', 'NOT grind snowboard'],\n",
       "       ['release bird', 'NOT release bird'],\n",
       "       ['grind skateboard', 'NOT grind skateboard'],\n",
       "       ['hold_and_about_to_eat banana',\n",
       "        'NOT hold_and_about_to_eat banana'],\n",
       "       ['train dog', 'NOT train dog'],\n",
       "       ['sit_inside bus', 'NOT sit_inside bus'],\n",
       "       ['block sports_ball', 'NOT block sports_ball'],\n",
       "       ['serve sports_ball', 'NOT serve sports_ball'],\n",
       "       ['turn motorcycle', 'NOT turn motorcycle'],\n",
       "       ['push motorcycle', 'NOT push motorcycle']], dtype=object)"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "execution_count": 2
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-08-04T16:43:35.784948Z",
     "start_time": "2024-08-04T16:43:35.778224Z"
    }
   },
   "cell_type": "code",
   "source": [
    "offset = 20\n",
    "correct = rules[0:100]\n",
    "incorrect = np.concatenate((rules[offset:100], rules[0:offset]), axis=0)\n",
    "correct.shape, incorrect.shape"
   ],
   "id": "2b9869e8cbc9001a",
   "outputs": [
    {
     "data": {
      "text/plain": [
       "((100, 2), (100, 2))"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "execution_count": 3
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-08-04T16:43:37.563480Z",
     "start_time": "2024-08-04T16:43:37.548119Z"
    }
   },
   "cell_type": "code",
   "source": [
    "edit_distance_ratio_warning_threshold = 0.7\n",
    "for i, (correct_concepts, incorrect_concepts) in enumerate(zip(correct, incorrect)):\n",
    "    left_distance = editdistance.eval(correct_concepts[0], incorrect_concepts[0])\n",
    "    right_distance = editdistance.eval(correct_concepts[1], incorrect_concepts[1])\n",
    "    left_ratio = left_distance / max(len(correct_concepts[0]), len(incorrect_concepts[0]))\n",
    "    right_ratio = right_distance / max(len(correct_concepts[1]), len(incorrect_concepts[1]))\n",
    "    print(\n",
    "        i,\n",
    "        \"-\",\n",
    "        f\"Left ED: {left_distance:02d} ({int(left_ratio * 100)}%)\",\n",
    "        \"-\",\n",
    "        f\"Right ED: {right_distance:02d} ({int(right_ratio * 100)}%)\",\n",
    "    )\n",
    "    if left_ratio < edit_distance_ratio_warning_threshold:\n",
    "        print(\"    \", \"Left\", left_distance, \"    Correct:\", correct_concepts[0], \"    Incorrect:\", incorrect_concepts[0])\n",
    "    if right_ratio < edit_distance_ratio_warning_threshold:\n",
    "        print(\"    \", \"Right\", right_distance, \"    Correct:\", correct_concepts[1], \"    Incorrect:\", incorrect_concepts[1])"
   ],
   "id": "c877317807b3b03f",
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 - Left ED: 13 (68%) - Right ED: 13 (56%)\n",
      "     Left 13     Correct: swing tennis_racket     Incorrect: sit_on toilet\n",
      "     Right 13     Correct: NOT swing tennis_racket     Incorrect: NOT sit_on toilet\n",
      "1 - Left ED: 10 (76%) - Right ED: 10 (58%)\n",
      "     Right 10     Correct: NOT throw frisbee     Incorrect: NOT clean toilet\n",
      "2 - Left ED: 18 (85%) - Right ED: 18 (72%)\n",
      "3 - Left ED: 20 (90%) - Right ED: 20 (76%)\n",
      "4 - Left ED: 12 (85%) - Right ED: 12 (66%)\n",
      "     Right 12     Correct: NOT use mouse     Incorrect: NOT sip wine_glass\n",
      "5 - Left ED: 10 (90%) - Right ED: 10 (66%)\n",
      "     Right 10     Correct: NOT shear sheep     Incorrect: NOT drive car\n",
      "6 - Left ED: 06 (75%) - Right ED: 06 (50%)\n",
      "     Right 6     Correct: NOT wear tie     Incorrect: NOT wash car\n",
      "7 - Left ED: 15 (88%) - Right ED: 15 (71%)\n",
      "8 - Left ED: 19 (86%) - Right ED: 19 (73%)\n",
      "9 - Left ED: 10 (90%) - Right ED: 10 (66%)\n",
      "     Right 10     Correct: NOT smell apple     Incorrect: NOT drive train\n",
      "10 - Left ED: 22 (81%) - Right ED: 22 (70%)\n",
      "11 - Left ED: 09 (90%) - Right ED: 09 (64%)\n",
      "     Right 9     Correct: NOT pick apple     Incorrect: NOT sail boat\n",
      "12 - Left ED: 15 (88%) - Right ED: 15 (71%)\n",
      "13 - Left ED: 22 (66%) - Right ED: 22 (59%)\n",
      "     Left 22     Correct: sit_on_with_multiple_person bench     Incorrect: sit_on airplane\n",
      "     Right 22     Correct: NOT sit_on_with_multiple_person bench     Incorrect: NOT sit_on airplane\n",
      "14 - Left ED: 11 (78%) - Right ED: 11 (61%)\n",
      "     Right 11     Correct: NOT stand_on chair     Incorrect: NOT control tv\n",
      "15 - Left ED: 15 (88%) - Right ED: 15 (71%)\n",
      "16 - Left ED: 10 (90%) - Right ED: 10 (66%)\n",
      "     Right 10     Correct: NOT eat orange     Incorrect: NOT hold person\n",
      "17 - Left ED: 12 (85%) - Right ED: 12 (66%)\n",
      "     Right 12     Correct: NOT squeeze orange     Incorrect: NOT kiss person\n",
      "18 - Left ED: 10 (90%) - Right ED: 10 (66%)\n",
      "     Right 10     Correct: NOT peel orange     Incorrect: NOT hug person\n",
      "19 - Left ED: 12 (85%) - Right ED: 12 (66%)\n",
      "     Right 12     Correct: NOT hold orange     Incorrect: NOT cut_with knife\n",
      "20 - Left ED: 14 (77%) - Right ED: 14 (63%)\n",
      "     Right 14     Correct: NOT sit_on toilet     Incorrect: NOT clean refrigerator\n",
      "21 - Left ED: 12 (70%) - Right ED: 12 (57%)\n",
      "     Right 12     Correct: NOT clean toilet     Incorrect: NOT open refrigerator\n",
      "22 - Left ED: 09 (81%) - Right ED: 09 (60%)\n",
      "     Right 9     Correct: NOT hold carrot     Incorrect: NOT fly kite\n",
      "23 - Left ED: 08 (53%) - Right ED: 08 (42%)\n",
      "     Left 8     Correct: hold wine_glass     Incorrect: hold kite\n",
      "     Right 8     Correct: NOT hold wine_glass     Incorrect: NOT hold kite\n",
      "24 - Left ED: 12 (85%) - Right ED: 12 (66%)\n",
      "     Right 12     Correct: NOT sip wine_glass     Incorrect: NOT type_on laptop\n",
      "25 - Left ED: 10 (90%) - Right ED: 10 (66%)\n",
      "     Right 10     Correct: NOT drive car     Incorrect: NOT hold laptop\n",
      "26 - Left ED: 10 (76%) - Right ED: 10 (58%)\n",
      "     Right 10     Correct: NOT wash car     Incorrect: NOT repair laptop\n",
      "27 - Left ED: 06 (75%) - Right ED: 06 (50%)\n",
      "     Right 6     Correct: NOT pet cat     Incorrect: NOT walk cow\n",
      "28 - Left ED: 04 (50%) - Right ED: 04 (33%)\n",
      "     Left 4     Correct: hug cat     Incorrect: cut cake\n",
      "     Right 4     Correct: NOT hug cat     Incorrect: NOT cut cake\n",
      "29 - Left ED: 09 (81%) - Right ED: 09 (60%)\n",
      "     Right 9     Correct: NOT drive train     Incorrect: NOT hold cake\n",
      "30 - Left ED: 08 (88%) - Right ED: 08 (61%)\n",
      "     Right 8     Correct: NOT ride boat     Incorrect: NOT blow cake\n",
      "31 - Left ED: 07 (70%) - Right ED: 07 (50%)\n",
      "     Right 7     Correct: NOT sail boat     Incorrect: NOT hold donut\n",
      "32 - Left ED: 15 (83%) - Right ED: 15 (68%)\n",
      "     Right 15     Correct: NOT drive boat     Incorrect: NOT hold tennis_racket\n",
      "33 - Left ED: 11 (73%) - Right ED: 11 (57%)\n",
      "     Right 11     Correct: NOT sit_on airplane     Incorrect: NOT catch frisbee\n",
      "34 - Left ED: 10 (83%) - Right ED: 10 (62%)\n",
      "     Right 10     Correct: NOT control tv     Incorrect: NOT hold frisbee\n",
      "35 - Left ED: 13 (86%) - Right ED: 13 (68%)\n",
      "     Right 13     Correct: NOT watch tv     Incorrect: NOT hold toothbrush\n",
      "36 - Left ED: 05 (45%) - Right ED: 05 (33%)\n",
      "     Left 5     Correct: hold person     Incorrect: hold remote\n",
      "     Right 5     Correct: NOT hold person     Incorrect: NOT hold remote\n",
      "37 - Left ED: 09 (81%) - Right ED: 09 (60%)\n",
      "     Right 9     Correct: NOT kiss person     Incorrect: NOT hold fork\n",
      "38 - Left ED: 08 (80%) - Right ED: 08 (57%)\n",
      "     Right 8     Correct: NOT hug person     Incorrect: NOT hold mouse\n",
      "39 - Left ED: 11 (78%) - Right ED: 11 (61%)\n",
      "     Right 11     Correct: NOT cut_with knife     Incorrect: NOT sit_on couch\n",
      "40 - Left ED: 16 (88%) - Right ED: 16 (72%)\n",
      "41 - Left ED: 14 (82%) - Right ED: 14 (66%)\n",
      "     Right 14     Correct: NOT open refrigerator     Incorrect: NOT feed sheep\n",
      "42 - Left ED: 07 (77%) - Right ED: 07 (53%)\n",
      "     Right 7     Correct: NOT fly kite     Incorrect: NOT pet sheep\n",
      "43 - Left ED: 04 (40%) - Right ED: 04 (28%)\n",
      "     Left 4     Correct: hold kite     Incorrect: hold sheep\n",
      "     Right 4     Correct: NOT hold kite     Incorrect: NOT hold sheep\n",
      "44 - Left ED: 13 (92%) - Right ED: 13 (72%)\n",
      "45 - Left ED: 06 (50%) - Right ED: 06 (37%)\n",
      "     Left 6     Correct: hold laptop     Incorrect: hold handbag\n",
      "     Right 6     Correct: NOT hold laptop     Incorrect: NOT hold handbag\n",
      "46 - Left ED: 12 (85%) - Right ED: 12 (66%)\n",
      "     Right 12     Correct: NOT repair laptop     Incorrect: NOT ride surfboard\n",
      "47 - Left ED: 14 (87%) - Right ED: 14 (70%)\n",
      "48 - Left ED: 12 (80%) - Right ED: 12 (63%)\n",
      "     Right 12     Correct: NOT cut cake     Incorrect: NOT carry surfboard\n",
      "49 - Left ED: 15 (88%) - Right ED: 15 (71%)\n",
      "50 - Left ED: 12 (85%) - Right ED: 12 (66%)\n",
      "     Right 12     Correct: NOT blow cake     Incorrect: NOT jump surfboard\n",
      "51 - Left ED: 08 (61%) - Right ED: 08 (47%)\n",
      "     Left 8     Correct: hold donut     Incorrect: hold scissors\n",
      "     Right 8     Correct: NOT hold donut     Incorrect: NOT hold scissors\n",
      "52 - Left ED: 17 (94%) - Right ED: 17 (77%)\n",
      "53 - Left ED: 09 (69%) - Right ED: 09 (52%)\n",
      "     Left 9     Correct: catch frisbee     Incorrect: eat apple\n",
      "     Right 9     Correct: NOT catch frisbee     Incorrect: NOT eat apple\n",
      "54 - Left ED: 06 (50%) - Right ED: 06 (37%)\n",
      "     Left 6     Correct: hold frisbee     Incorrect: hold apple\n",
      "     Right 6     Correct: NOT hold frisbee     Incorrect: NOT hold apple\n",
      "55 - Left ED: 14 (93%) - Right ED: 14 (73%)\n",
      "56 - Left ED: 11 (91%) - Right ED: 11 (68%)\n",
      "     Right 11     Correct: NOT hold remote     Incorrect: NOT sit_on bench\n",
      "57 - Left ED: 11 (91%) - Right ED: 11 (68%)\n",
      "     Right 11     Correct: NOT hold fork     Incorrect: NOT lie_on bench\n",
      "58 - Left ED: 11 (91%) - Right ED: 11 (68%)\n",
      "     Right 11     Correct: NOT hold mouse     Incorrect: NOT sit_on chair\n",
      "59 - Left ED: 14 (87%) - Right ED: 14 (70%)\n",
      "60 - Left ED: 11 (91%) - Right ED: 11 (68%)\n",
      "     Right 11     Correct: NOT lie_on couch     Incorrect: NOT board train\n",
      "61 - Left ED: 12 (92%) - Right ED: 12 (70%)\n",
      "62 - Left ED: 08 (88%) - Right ED: 08 (61%)\n",
      "     Right 8     Correct: NOT pet sheep     Incorrect: NOT row boat\n",
      "63 - Left ED: 14 (93%) - Right ED: 14 (73%)\n",
      "64 - Left ED: 12 (92%) - Right ED: 12 (70%)\n",
      "65 - Left ED: 10 (83%) - Right ED: 10 (62%)\n",
      "     Right 10     Correct: NOT hold handbag     Incorrect: NOT lick knife\n",
      "66 - Left ED: 12 (85%) - Right ED: 12 (66%)\n",
      "     Right 12     Correct: NOT ride surfboard     Incorrect: NOT wield knife\n",
      "67 - Left ED: 14 (87%) - Right ED: 14 (70%)\n",
      "68 - Left ED: 13 (86%) - Right ED: 13 (68%)\n",
      "     Right 13     Correct: NOT carry surfboard     Incorrect: NOT read laptop\n",
      "69 - Left ED: 15 (88%) - Right ED: 15 (71%)\n",
      "70 - Left ED: 08 (53%) - Right ED: 08 (42%)\n",
      "     Left 8     Correct: jump surfboard     Incorrect: grind snowboard\n",
      "     Right 8     Correct: NOT jump surfboard     Incorrect: NOT grind snowboard\n",
      "71 - Left ED: 10 (76%) - Right ED: 10 (58%)\n",
      "     Right 10     Correct: NOT hold scissors     Incorrect: NOT release bird\n",
      "72 - Left ED: 14 (82%) - Right ED: 14 (66%)\n",
      "     Right 14     Correct: NOT cut_with scissors     Incorrect: NOT grind skateboard\n",
      "73 - Left ED: 23 (82%) - Right ED: 23 (71%)\n",
      "74 - Left ED: 10 (100%) - Right ED: 10 (71%)\n",
      "75 - Left ED: 13 (92%) - Right ED: 13 (72%)\n",
      "76 - Left ED: 16 (94%) - Right ED: 16 (76%)\n",
      "77 - Left ED: 15 (88%) - Right ED: 15 (71%)\n",
      "78 - Left ED: 13 (86%) - Right ED: 13 (68%)\n",
      "     Right 13     Correct: NOT sit_on chair     Incorrect: NOT turn motorcycle\n",
      "79 - Left ED: 14 (87%) - Right ED: 14 (70%)\n",
      "80 - Left ED: 15 (78%) - Right ED: 15 (65%)\n",
      "     Right 15     Correct: NOT board train     Incorrect: NOT swing tennis_racket\n",
      "81 - Left ED: 13 (100%) - Right ED: 13 (76%)\n",
      "82 - Left ED: 16 (76%) - Right ED: 16 (64%)\n",
      "     Right 16     Correct: NOT row boat     Incorrect: NOT brush_with toothbrush\n",
      "83 - Left ED: 17 (77%) - Right ED: 17 (65%)\n",
      "     Right 17     Correct: NOT direct airplane     Incorrect: NOT point_at_camera remote\n",
      "84 - Left ED: 09 (75%) - Right ED: 09 (56%)\n",
      "     Right 9     Correct: NOT greet person     Incorrect: NOT use mouse\n",
      "85 - Left ED: 10 (90%) - Right ED: 10 (66%)\n",
      "     Right 10     Correct: NOT lick knife     Incorrect: NOT shear sheep\n",
      "86 - Left ED: 06 (54%) - Right ED: 06 (40%)\n",
      "     Left 6     Correct: wield knife     Incorrect: wear tie\n",
      "     Right 6     Correct: NOT wield knife     Incorrect: NOT wear tie\n",
      "87 - Left ED: 14 (82%) - Right ED: 14 (66%)\n",
      "     Right 14     Correct: NOT stick knife     Incorrect: NOT adjust_or_tie tie\n",
      "88 - Left ED: 18 (81%) - Right ED: 18 (69%)\n",
      "     Right 18     Correct: NOT read laptop     Incorrect: NOT help_adjust_or_tie tie\n",
      "89 - Left ED: 08 (72%) - Right ED: 08 (53%)\n",
      "     Right 8     Correct: NOT milk cow     Incorrect: NOT smell apple\n",
      "90 - Left ED: 22 (81%) - Right ED: 22 (70%)\n",
      "91 - Left ED: 12 (100%) - Right ED: 12 (75%)\n",
      "92 - Left ED: 16 (94%) - Right ED: 16 (76%)\n",
      "93 - Left ED: 26 (78%) - Right ED: 26 (70%)\n",
      "94 - Left ED: 11 (78%) - Right ED: 11 (61%)\n",
      "     Right 11     Correct: NOT train dog     Incorrect: NOT stand_on chair\n",
      "95 - Left ED: 11 (64%) - Right ED: 11 (52%)\n",
      "     Left 11     Correct: sit_inside bus     Incorrect: lie_on_like chair\n",
      "     Right 11     Correct: NOT sit_inside bus     Incorrect: NOT lie_on_like chair\n",
      "96 - Left ED: 14 (82%) - Right ED: 14 (66%)\n",
      "     Right 14     Correct: NOT block sports_ball     Incorrect: NOT eat orange\n",
      "97 - Left ED: 13 (76%) - Right ED: 13 (61%)\n",
      "     Right 13     Correct: NOT serve sports_ball     Incorrect: NOT squeeze orange\n",
      "98 - Left ED: 11 (73%) - Right ED: 11 (57%)\n",
      "     Right 11     Correct: NOT turn motorcycle     Incorrect: NOT peel orange\n",
      "99 - Left ED: 11 (73%) - Right ED: 11 (57%)\n",
      "     Right 11     Correct: NOT push motorcycle     Incorrect: NOT hold orange\n"
     ]
    }
   ],
   "execution_count": 4
  },
  {
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-08-04T16:45:54.385091Z",
     "start_time": "2024-08-04T16:45:54.373Z"
    }
   },
   "cell_type": "code",
   "source": [
    "lcs_warning_threshold = 2\n",
    "for i, (correct_concepts, incorrect_concepts) in enumerate(zip(correct, incorrect)):\n",
    "    left_lcs = get_longest_common_word_subsequence_length(correct_concepts[0], incorrect_concepts[0])\n",
    "    right_lcs = get_longest_common_word_subsequence_length(correct_concepts[1], incorrect_concepts[1])\n",
    "    left_ratio = left_lcs / min(len(correct_concepts[0]), len(incorrect_concepts[0]))\n",
    "    right_ratio = right_lcs / min(len(correct_concepts[1]), len(incorrect_concepts[1]))\n",
    "    print(\n",
    "        i,\n",
    "        \"-\",\n",
    "        f\"Left LCS: {left_lcs} ({int(left_ratio * 100)}%)\",\n",
    "        \"-\",\n",
    "        f\"Right LCS: {right_lcs} ({int(right_ratio * 100)}%)\",\n",
    "    )\n",
    "    if left_lcs >= lcs_warning_threshold:\n",
    "        print(\"    \", \"Left\", \"    Correct:\", correct_concepts[0], \"    Incorrect:\", incorrect_concepts[0])\n",
    "    if right_lcs >= lcs_warning_threshold:\n",
    "        print(\"    \", \"Right\", \"    Correct:\", correct_concepts[1], \"    Incorrect:\", incorrect_concepts[1])"
   ],
   "id": "d30e348a2b7c8496",
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "1 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "2 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "3 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "4 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "5 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "6 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "7 - Left LCS: 0 (0%) - Right LCS: 1 (9%)\n",
      "8 - Left LCS: 0 (0%) - Right LCS: 1 (9%)\n",
      "9 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "10 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "11 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "12 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "13 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "14 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "15 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "16 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "17 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "18 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "19 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "20 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "21 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "22 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "23 - Left LCS: 1 (11%) - Right LCS: 2 (15%)\n",
      "     Right     Correct: NOT hold wine_glass     Incorrect: NOT hold kite\n",
      "24 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "25 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "26 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "27 - Left LCS: 0 (0%) - Right LCS: 1 (9%)\n",
      "28 - Left LCS: 0 (0%) - Right LCS: 1 (9%)\n",
      "29 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "30 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "31 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "32 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "33 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "34 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "35 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "36 - Left LCS: 1 (9%) - Right LCS: 2 (13%)\n",
      "     Right     Correct: NOT hold person     Incorrect: NOT hold remote\n",
      "37 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "38 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "39 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "40 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "41 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "42 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "43 - Left LCS: 1 (11%) - Right LCS: 2 (15%)\n",
      "     Right     Correct: NOT hold kite     Incorrect: NOT hold sheep\n",
      "44 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "45 - Left LCS: 1 (9%) - Right LCS: 2 (13%)\n",
      "     Right     Correct: NOT hold laptop     Incorrect: NOT hold handbag\n",
      "46 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "47 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "48 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "49 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "50 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "51 - Left LCS: 1 (10%) - Right LCS: 2 (14%)\n",
      "     Right     Correct: NOT hold donut     Incorrect: NOT hold scissors\n",
      "52 - Left LCS: 0 (0%) - Right LCS: 1 (4%)\n",
      "53 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "54 - Left LCS: 1 (10%) - Right LCS: 2 (14%)\n",
      "     Right     Correct: NOT hold frisbee     Incorrect: NOT hold apple\n",
      "55 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "56 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "57 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "58 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "59 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "60 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "61 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "62 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "63 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "64 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "65 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "66 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "67 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "68 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "69 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "70 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "71 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "72 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "73 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "74 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "75 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "76 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "77 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "78 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "79 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "80 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "81 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "82 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "83 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "84 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "85 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "86 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "87 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "88 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "89 - Left LCS: 0 (0%) - Right LCS: 1 (8%)\n",
      "90 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "91 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "92 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "93 - Left LCS: 0 (0%) - Right LCS: 1 (3%)\n",
      "94 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "95 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "96 - Left LCS: 0 (0%) - Right LCS: 1 (7%)\n",
      "97 - Left LCS: 0 (0%) - Right LCS: 1 (5%)\n",
      "98 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n",
      "99 - Left LCS: 0 (0%) - Right LCS: 1 (6%)\n"
     ]
    }
   ],
   "execution_count": 5
  },
  {
   "metadata": {},
   "cell_type": "code",
   "outputs": [],
   "execution_count": null,
   "source": "",
   "id": "f5bf662600aa6dfe"
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 2
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython2",
   "version": "2.7.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
