[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "dehydrogenation (DH)",
            "oxidation (Ox)",
            "loss of electrons (LE)",
            "deprotonation (DPN)",
            "nitrification (NF)",
            "halogenation (HL)",
            "peroxidation (PO)",
            "dissolution of metal ions (DMI)",
            "photooxidation (POx)",
            "electrochemical oxidation (EOx)",
            "metal ion oxidation (MIO)",
            "autoxidation (AOx)",
            "biological oxidation (BOx)",
            "alkylation (ALK)",
            "desulfurization (DSF)",
            "denitrogenation (DNG)",
            "demethylation (DMT)",
            "decarboxylation (DCB)",
            "deamination (DMA)",
            "dehydroxylation (DHY)",
            "dehalogenation (DHL)",
            "dehydroxylation of alcohols (DHA)",
            "dehydrogenation of aldehydes (DHAld)",
            "dehydrogenation of ketones (DHK)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "dehydrogenation (DH)",
                "oxidation (Ox)",
                "loss of electrons (LE)",
                "deprotonation (DPN)",
                "nitrification (NF)",
                "halogenation (HL)",
                "peroxidation (PO)",
                "dissolution of metal ions (DMI)",
                "photooxidation (POx)",
                "electrochemical oxidation (EOx)",
                "metal ion oxidation (MIO)",
                "autoxidation (AOx)",
                "biological oxidation (BOx)",
                "alkylation (ALK)",
                "desulfurization (DSF)",
                "denitrogenation (DNG)",
                "demethylation (DMT)",
                "decarboxylation (DCB)",
                "deamination (DMA)",
                "dehydroxylation (DHY)",
                "dehalogenation (DHL)",
                "dehydroxylation of alcohols (DHA)",
                "dehydrogenation of aldehydes (DHAld)",
                "dehydrogenation of ketones (DHK)"
            ],
            "mismatches": [],
            "true_referents": [
                "alkylation (ALK)",
                "autoxidation (AOx)",
                "biological oxidation (BOx)",
                "deamination (DMA)",
                "decarboxylation (DCB)",
                "dehalogenation (DHL)",
                "dehydrogenation (DH)",
                "dehydrogenation of aldehydes (DHAld)",
                "dehydrogenation of ketones (DHK)",
                "dehydroxylation (DHY)",
                "dehydroxylation of alcohols (DHA)",
                "demethylation (DMT)",
                "denitrogenation (DNG)",
                "deprotonation (DPN)",
                "desulfurization (DSF)",
                "dissolution of metal ions (DMI)",
                "electrochemical oxidation (EOx)",
                "halogenation (HL)",
                "loss of electrons (LE)",
                "metal ion oxidation (MIO)",
                "nitrification (NF)",
                "oxidation (Ox)",
                "peroxidation (PO)",
                "photooxidation (POx)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Oxidation of glucose in cellular respiration (Glycolysis)",
            "Oxidation of ethanol to acetaldehyde in the liver (Ethanol oxidation)",
            "Oxidation of iron(II) to iron(III) (Ferric oxidation)",
            "Oxidation of sulfur in pyrite to sulfate (Pyrite oxidation)",
            "Oxidation of iodide to iodine (Iodide oxidation)",
            "Oxidation of alcohols to aldehydes or ketones (Alcohol oxidation)",
            "Oxidation of aldehydes to carboxylic acids (Aldehyde oxidation)",
            "Oxidation of ammonia to nitrite in nitrification (Ammonia oxidation)",
            "Oxidation of methane to methanol in methanotrophs (Methane oxidation)",
            "Oxidation of ferrous iron to ferric iron in water treatment (Ferrous oxidation)",
            "Oxidation of sulfide to sulfate in sulfur bacteria (Sulfide oxidation)",
            "Oxidation of carbon monoxide to carbon dioxide (Carbon monoxide oxidation)",
            "Oxidation of hydrogen sulfide to sulfur or sulfate (Hydrogen sulfide oxidation)",
            "Oxidation of nitrogen in the nitrogen cycle (Nitrogen oxidation)",
            "Oxidation of phenols to quinones (Phenol oxidation)",
            "Oxidation of ascorbic acid to dehydroascorbic acid (Ascorbic acid oxidation)",
            "Oxidation of thiol groups to disulfides (Thiol oxidation)",
            "Oxidation of hydrocarbons in combustion (Hydrocarbon oxidation)",
            "Oxidation of glucose to gluconic acid (Gluconic acid formation)",
            "Oxidation of methanol to formaldehyde (Methanol oxidation)",
            "Oxidation of isopropanol to acetone (Isopropanol oxidation)",
            "Oxidation of nitrite to nitrate in nitrification (Nitrite oxidation)",
            "Oxidation of carbon to carbon dioxide in cellular respiration (Carbon oxidation)",
            "Oxidation of hydrogen to water in fuel cells (Hydrogen oxidation)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Oxidation of glucose in cellular respiration (Glycolysis)",
                "Oxidation of ethanol to acetaldehyde in the liver (Ethanol oxidation)",
                "Oxidation of iron(II) to iron(III) (Ferric oxidation)",
                "Oxidation of sulfur in pyrite to sulfate (Pyrite oxidation)",
                "Oxidation of iodide to iodine (Iodide oxidation)",
                "Oxidation of alcohols to aldehydes or ketones (Alcohol oxidation)",
                "Oxidation of aldehydes to carboxylic acids (Aldehyde oxidation)",
                "Oxidation of ammonia to nitrite in nitrification (Ammonia oxidation)",
                "Oxidation of methane to methanol in methanotrophs (Methane oxidation)",
                "Oxidation of ferrous iron to ferric iron in water treatment (Ferrous oxidation)",
                "Oxidation of sulfide to sulfate in sulfur bacteria (Sulfide oxidation)",
                "Oxidation of carbon monoxide to carbon dioxide (Carbon monoxide oxidation)",
                "Oxidation of hydrogen sulfide to sulfur or sulfate (Hydrogen sulfide oxidation)",
                "Oxidation of nitrogen in the nitrogen cycle (Nitrogen oxidation)",
                "Oxidation of phenols to quinones (Phenol oxidation)",
                "Oxidation of ascorbic acid to dehydroascorbic acid (Ascorbic acid oxidation)",
                "Oxidation of thiol groups to disulfides (Thiol oxidation)",
                "Oxidation of hydrocarbons in combustion (Hydrocarbon oxidation)",
                "Oxidation of glucose to gluconic acid (Gluconic acid formation)",
                "Oxidation of methanol to formaldehyde (Methanol oxidation)",
                "Oxidation of isopropanol to acetone (Isopropanol oxidation)",
                "Oxidation of nitrite to nitrate in nitrification (Nitrite oxidation)",
                "Oxidation of carbon to carbon dioxide in cellular respiration (Carbon oxidation)",
                "Oxidation of hydrogen to water in fuel cells (Hydrogen oxidation)"
            ],
            "mismatches": [],
            "true_referents": [
                "Oxidation of alcohols to aldehydes or ketones (Alcohol oxidation)",
                "Oxidation of aldehydes to carboxylic acids (Aldehyde oxidation)",
                "Oxidation of ammonia to nitrite in nitrification (Ammonia oxidation)",
                "Oxidation of ascorbic acid to dehydroascorbic acid (Ascorbic acid oxidation)",
                "Oxidation of carbon monoxide to carbon dioxide (Carbon monoxide oxidation)",
                "Oxidation of carbon to carbon dioxide in cellular respiration (Carbon oxidation)",
                "Oxidation of ethanol to acetaldehyde in the liver (Ethanol oxidation)",
                "Oxidation of ferrous iron to ferric iron in water treatment (Ferrous oxidation)",
                "Oxidation of glucose in cellular respiration (Glycolysis)",
                "Oxidation of glucose to gluconic acid (Gluconic acid formation)",
                "Oxidation of hydrocarbons in combustion (Hydrocarbon oxidation)",
                "Oxidation of hydrogen sulfide to sulfur or sulfate (Hydrogen sulfide oxidation)",
                "Oxidation of hydrogen to water in fuel cells (Hydrogen oxidation)",
                "Oxidation of iodide to iodine (Iodide oxidation)",
                "Oxidation of iron(II) to iron(III) (Ferric oxidation)",
                "Oxidation of isopropanol to acetone (Isopropanol oxidation)",
                "Oxidation of methane to methanol in methanotrophs (Methane oxidation)",
                "Oxidation of methanol to formaldehyde (Methanol oxidation)",
                "Oxidation of nitrite to nitrate in nitrification (Nitrite oxidation)",
                "Oxidation of nitrogen in the nitrogen cycle (Nitrogen oxidation)",
                "Oxidation of phenols to quinones (Phenol oxidation)",
                "Oxidation of sulfide to sulfate in sulfur bacteria (Sulfide oxidation)",
                "Oxidation of sulfur in pyrite to sulfate (Pyrite oxidation)",
                "Oxidation of thiol groups to disulfides (Thiol oxidation)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Oxidation of Glucose (Glycolysis)",
            "Oxidation of Fatty Acids (Beta-Oxidation)",
            "Oxidation of Alcohol",
            "Oxidation of Ammonia to Nitrite",
            "Oxidation of Methane to Methanol",
            "Oxidation of Ethanol to Acetaldehyde",
            "Oxidation of Ferrous Iron (Fe2+) to Ferric Iron (Fe3+)",
            "Oxidation of Ascorbic Acid",
            "Oxidation of Sulfur Dioxide to Sulfur Trioxide",
            "Oxidation of Carbon Monoxide to Carbon Dioxide",
            "Oxidation of Hydrogen Peroxide to Oxygen",
            "Oxidation of Hydroquinone to Benzoquinone",
            "Oxidation of Phenols",
            "Oxidation of Aldehydes to Carboxylic Acids",
            "Oxidation of Primary Alcohols to Aldehydes",
            "Oxidation of Secondary Alcohols to Ketones",
            "Oxidation of Tertiary Alcohols",
            "Oxidation of Thiols to Disulfides",
            "Oxidation of Phenols to Quinones",
            "Oxidation of Amines to Nitro Compounds",
            "Oxidation of Hydrocarbons",
            "Oxidation of Organic Sulfur Compounds",
            "Oxidation of Organic Nitrogen Compounds",
            "Oxidation of Organic Phosphorus Compounds"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Oxidation of Glucose (Glycolysis)",
                "Oxidation of Fatty Acids (Beta-Oxidation)",
                "Oxidation of Alcohol",
                "Oxidation of Ammonia to Nitrite",
                "Oxidation of Methane to Methanol",
                "Oxidation of Ethanol to Acetaldehyde",
                "Oxidation of Ferrous Iron (Fe2+) to Ferric Iron (Fe3+)",
                "Oxidation of Ascorbic Acid",
                "Oxidation of Sulfur Dioxide to Sulfur Trioxide",
                "Oxidation of Carbon Monoxide to Carbon Dioxide",
                "Oxidation of Hydrogen Peroxide to Oxygen",
                "Oxidation of Hydroquinone to Benzoquinone",
                "Oxidation of Phenols",
                "Oxidation of Aldehydes to Carboxylic Acids",
                "Oxidation of Primary Alcohols to Aldehydes",
                "Oxidation of Secondary Alcohols to Ketones",
                "Oxidation of Tertiary Alcohols",
                "Oxidation of Thiols to Disulfides",
                "Oxidation of Phenols to Quinones",
                "Oxidation of Amines to Nitro Compounds",
                "Oxidation of Hydrocarbons",
                "Oxidation of Organic Sulfur Compounds",
                "Oxidation of Organic Nitrogen Compounds",
                "Oxidation of Organic Phosphorus Compounds"
            ],
            "mismatches": [],
            "true_referents": [
                "Oxidation of Alcohol",
                "Oxidation of Aldehydes to Carboxylic Acids",
                "Oxidation of Amines to Nitro Compounds",
                "Oxidation of Ammonia to Nitrite",
                "Oxidation of Ascorbic Acid",
                "Oxidation of Carbon Monoxide to Carbon Dioxide",
                "Oxidation of Ethanol to Acetaldehyde",
                "Oxidation of Fatty Acids (Beta-Oxidation)",
                "Oxidation of Ferrous Iron (Fe2+) to Ferric Iron (Fe3+)",
                "Oxidation of Glucose (Glycolysis)",
                "Oxidation of Hydrocarbons",
                "Oxidation of Hydrogen Peroxide to Oxygen",
                "Oxidation of Hydroquinone to Benzoquinone",
                "Oxidation of Methane to Methanol",
                "Oxidation of Organic Nitrogen Compounds",
                "Oxidation of Organic Phosphorus Compounds",
                "Oxidation of Organic Sulfur Compounds",
                "Oxidation of Phenols",
                "Oxidation of Phenols to Quinones",
                "Oxidation of Primary Alcohols to Aldehydes",
                "Oxidation of Secondary Alcohols to Ketones",
                "Oxidation of Sulfur Dioxide to Sulfur Trioxide",
                "Oxidation of Tertiary Alcohols",
                "Oxidation of Thiols to Disulfides"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Combustion (Comb)",
            "Corrosion (Corr)",
            "Respiration (Resp)",
            "Metal Rusting (Rust)",
            "Bleaching (Bleach)",
            "Photodegradation of Polymers (PhotoDeg)",
            "Hemoglobin Oxidation (HbOx)",
            "Glucose Oxidation (GlcOx)",
            "Ethanol Metabolism (EtOHMetab)",
            "Lignin Decomposition (LigninDecomp)",
            "Iron Oxidation in Hemerythrin (HemyOx)",
            "Silver Tarnish (AgTarnish)",
            "Formation of Metal Oxides (MetalOx)",
            "Oxidation of Aldehydes to Carboxylic Acids (AldOx)",
            "Oxidation of Alcohols to Ketones/Aldehydes (AlcOx)",
            "Oxidative Phosphorylation (OxPhos)",
            "Mitochondrial Electron Transport Chain (ETC)",
            "Lipid Peroxidation (LipPerox)",
            "Dopamine to Dopaquinones Conversion (DAtoDAQ)",
            "GSH Oxidation in Glutathione Peroxidase (GSHOx)",
            "Catecholamine Oxidation (CatOx)",
            "Myoglobin Oxygenation (MyoOx)",
            "Vitamin C Degradation (VitCDeg)",
            "Polycyclic Aromatic Hydrocarbon Oxidation (PAHOx)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Combustion (Comb)",
                "Corrosion (Corr)",
                "Respiration (Resp)",
                "Metal Rusting (Rust)",
                "Bleaching (Bleach)",
                "Photodegradation of Polymers (PhotoDeg)",
                "Hemoglobin Oxidation (HbOx)",
                "Glucose Oxidation (GlcOx)",
                "Ethanol Metabolism (EtOHMetab)",
                "Lignin Decomposition (LigninDecomp)",
                "Iron Oxidation in Hemerythrin (HemyOx)",
                "Silver Tarnish (AgTarnish)",
                "Formation of Metal Oxides (MetalOx)",
                "Oxidation of Aldehydes to Carboxylic Acids (AldOx)",
                "Oxidation of Alcohols to Ketones/Aldehydes (AlcOx)",
                "Oxidative Phosphorylation (OxPhos)",
                "Mitochondrial Electron Transport Chain (ETC)",
                "Lipid Peroxidation (LipPerox)",
                "Dopamine to Dopaquinones Conversion (DAtoDAQ)",
                "GSH Oxidation in Glutathione Peroxidase (GSHOx)",
                "Catecholamine Oxidation (CatOx)",
                "Myoglobin Oxygenation (MyoOx)",
                "Vitamin C Degradation (VitCDeg)",
                "Polycyclic Aromatic Hydrocarbon Oxidation (PAHOx)"
            ],
            "mismatches": [],
            "true_referents": [
                "Bleaching (Bleach)",
                "Catecholamine Oxidation (CatOx)",
                "Combustion (Comb)",
                "Corrosion (Corr)",
                "Dopamine to Dopaquinones Conversion (DAtoDAQ)",
                "Ethanol Metabolism (EtOHMetab)",
                "Formation of Metal Oxides (MetalOx)",
                "GSH Oxidation in Glutathione Peroxidase (GSHOx)",
                "Glucose Oxidation (GlcOx)",
                "Hemoglobin Oxidation (HbOx)",
                "Iron Oxidation in Hemerythrin (HemyOx)",
                "Lignin Decomposition (LigninDecomp)",
                "Lipid Peroxidation (LipPerox)",
                "Metal Rusting (Rust)",
                "Mitochondrial Electron Transport Chain (ETC)",
                "Myoglobin Oxygenation (MyoOx)",
                "Oxidation of Alcohols to Ketones/Aldehydes (AlcOx)",
                "Oxidation of Aldehydes to Carboxylic Acids (AldOx)",
                "Oxidative Phosphorylation (OxPhos)",
                "Photodegradation of Polymers (PhotoDeg)",
                "Polycyclic Aromatic Hydrocarbon Oxidation (PAHOx)",
                "Respiration (Resp)",
                "Silver Tarnish (AgTarnish)",
                "Vitamin C Degradation (VitCDeg)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Combustion of Methane (CH4)",
            "Oxidation of Glucose (C6H12O6)",
            "Rusting of Iron (Fe)",
            "Oxidation of Ethanol (C2H5OH)",
            "Formation of Sulfur Dioxide (SO2)",
            "Oxidation of Ammonia (NH3)",
            "Oxidation of Hydrogen Sulfide (H2S)",
            "Conversion of Ferrous to Ferric Ion (Fe2+ to Fe3+)",
            "Oxidation of Formaldehyde (CH2O)",
            "Oxidation of Carbon Monoxide (CO)",
            "Oxidation of Iodide to Iodine (I- to I2)",
            "Oxidation of Nitric Oxide to Nitrogen Dioxide (NO to NO2)",
            "Oxidation of Sulfite to Sulfate (SO3 2- to SO4 2-)",
            "Oxidation of Benzene to Phenol (C6H6 to C6H5OH)",
            "Oxidation of Acetaldehyde to Acetic Acid (CH3CHO to CH3COOH)",
            "Oxidation of Thiol to Disulfide (RSH to RSSR)",
            "Oxidation of Cyclohexanol to Cyclohexanone",
            "Oxidation of Ascorbic Acid (Vitamin C)",
            "Oxidation of Cysteine to Cystine",
            "Oxidation of Pyruvate to Acetyl-CoA",
            "Oxidation of Ubiquinol to Ubiquinone",
            "Oxidation of NADH to NAD+",
            "Oxidation of FADH2 to FAD",
            "Oxidation of Sulfur to Sulfuric Acid (S to H2SO4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Combustion of Methane (CH4)",
                "Oxidation of Glucose (C6H12O6)",
                "Rusting of Iron (Fe)",
                "Oxidation of Ethanol (C2H5OH)",
                "Formation of Sulfur Dioxide (SO2)",
                "Oxidation of Ammonia (NH3)",
                "Oxidation of Hydrogen Sulfide (H2S)",
                "Conversion of Ferrous to Ferric Ion (Fe2+ to Fe3+)",
                "Oxidation of Formaldehyde (CH2O)",
                "Oxidation of Carbon Monoxide (CO)",
                "Oxidation of Iodide to Iodine (I- to I2)",
                "Oxidation of Nitric Oxide to Nitrogen Dioxide (NO to NO2)",
                "Oxidation of Sulfite to Sulfate (SO3 2- to SO4 2-)",
                "Oxidation of Benzene to Phenol (C6H6 to C6H5OH)",
                "Oxidation of Acetaldehyde to Acetic Acid (CH3CHO to CH3COOH)",
                "Oxidation of Thiol to Disulfide (RSH to RSSR)",
                "Oxidation of Cyclohexanol to Cyclohexanone",
                "Oxidation of Ascorbic Acid (Vitamin C)",
                "Oxidation of Cysteine to Cystine",
                "Oxidation of Pyruvate to Acetyl-CoA",
                "Oxidation of Ubiquinol to Ubiquinone",
                "Oxidation of NADH to NAD+",
                "Oxidation of FADH2 to FAD",
                "Oxidation of Sulfur to Sulfuric Acid (S to H2SO4)"
            ],
            "mismatches": [],
            "true_referents": [
                "Combustion of Methane (CH4)",
                "Conversion of Ferrous to Ferric Ion (Fe2+ to Fe3+)",
                "Formation of Sulfur Dioxide (SO2)",
                "Oxidation of Acetaldehyde to Acetic Acid (CH3CHO to CH3COOH)",
                "Oxidation of Ammonia (NH3)",
                "Oxidation of Ascorbic Acid (Vitamin C)",
                "Oxidation of Benzene to Phenol (C6H6 to C6H5OH)",
                "Oxidation of Carbon Monoxide (CO)",
                "Oxidation of Cyclohexanol to Cyclohexanone",
                "Oxidation of Cysteine to Cystine",
                "Oxidation of Ethanol (C2H5OH)",
                "Oxidation of FADH2 to FAD",
                "Oxidation of Formaldehyde (CH2O)",
                "Oxidation of Glucose (C6H12O6)",
                "Oxidation of Hydrogen Sulfide (H2S)",
                "Oxidation of Iodide to Iodine (I- to I2)",
                "Oxidation of NADH to NAD+",
                "Oxidation of Nitric Oxide to Nitrogen Dioxide (NO to NO2)",
                "Oxidation of Pyruvate to Acetyl-CoA",
                "Oxidation of Sulfite to Sulfate (SO3 2- to SO4 2-)",
                "Oxidation of Sulfur to Sulfuric Acid (S to H2SO4)",
                "Oxidation of Thiol to Disulfide (RSH to RSSR)",
                "Oxidation of Ubiquinol to Ubiquinone",
                "Rusting of Iron (Fe)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Combustion of hydrocarbons (CH4)",
            "Oxidation of iron (Fe to Fe2+)",
            "Respiration in aerobic organisms (C6H12O6)",
            "Oxidation of glucose (C6H12O6 to CO2)",
            "Oxidation of ethanol to acetaldehyde (C2H5OH)",
            "Oxidation of sulfur dioxide to sulfur trioxide (SO2 to SO3)",
            "Oxidation of hydrogen sulfide to sulfur (H2S to S)",
            "Oxidation of ammonia to nitrite (NH3 to NO2-)",
            "Oxidation of magnesium (Mg to Mg2+)",
            "Oxidation of copper (Cu to Cu2+)",
            "Oxidation of silver (Ag to Ag+)",
            "Oxidation of glucose to gluconic acid (C6H12O6 to C6H12O7)",
            "Oxidation of ascorbic acid (C6H8O6 to C6H6O6)",
            "Oxidation of fatty acids in beta-oxidation (C16H32O2)",
            "Oxidation of phenol to quinone (C6H5OH to C6H4O2)",
            "Oxidation of pyruvate to acetyl-CoA (C3H4O3 to C2H3O-CoA)",
            "Oxidation of hydrogen gas to protons (H2 to 2H+)",
            "Oxidation of sodium thiosulfate to sulfate (Na2S2O3 to Na2SO4)",
            "Oxidation of glucose-6-phosphate to 6-phosphogluconate (C6H13O9P)",
            "Oxidation of cholesterol to bile acids (C27H46O)",
            "Oxidation of lactate to pyruvate (C3H6O3 to C3H4O3)",
            "Oxidation of 2-propanol to acetone (C3H8O to C3H6O)",
            "Oxidation of aldehydes to carboxylic acids (RCHO to RCOOH)",
            "Oxidation of ferrous ions to ferric ions (Fe2+ to Fe3+)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Combustion of hydrocarbons (CH4)",
                "Oxidation of iron (Fe to Fe2+)",
                "Respiration in aerobic organisms (C6H12O6)",
                "Oxidation of glucose (C6H12O6 to CO2)",
                "Oxidation of ethanol to acetaldehyde (C2H5OH)",
                "Oxidation of sulfur dioxide to sulfur trioxide (SO2 to SO3)",
                "Oxidation of hydrogen sulfide to sulfur (H2S to S)",
                "Oxidation of ammonia to nitrite (NH3 to NO2-)",
                "Oxidation of magnesium (Mg to Mg2+)",
                "Oxidation of copper (Cu to Cu2+)",
                "Oxidation of silver (Ag to Ag+)",
                "Oxidation of glucose to gluconic acid (C6H12O6 to C6H12O7)",
                "Oxidation of ascorbic acid (C6H8O6 to C6H6O6)",
                "Oxidation of fatty acids in beta-oxidation (C16H32O2)",
                "Oxidation of phenol to quinone (C6H5OH to C6H4O2)",
                "Oxidation of pyruvate to acetyl-CoA (C3H4O3 to C2H3O-CoA)",
                "Oxidation of hydrogen gas to protons (H2 to 2H+)",
                "Oxidation of sodium thiosulfate to sulfate (Na2S2O3 to Na2SO4)",
                "Oxidation of glucose-6-phosphate to 6-phosphogluconate (C6H13O9P)",
                "Oxidation of cholesterol to bile acids (C27H46O)",
                "Oxidation of lactate to pyruvate (C3H6O3 to C3H4O3)",
                "Oxidation of 2-propanol to acetone (C3H8O to C3H6O)",
                "Oxidation of aldehydes to carboxylic acids (RCHO to RCOOH)",
                "Oxidation of ferrous ions to ferric ions (Fe2+ to Fe3+)"
            ],
            "mismatches": [],
            "true_referents": [
                "Combustion of hydrocarbons (CH4)",
                "Oxidation of 2-propanol to acetone (C3H8O to C3H6O)",
                "Oxidation of aldehydes to carboxylic acids (RCHO to RCOOH)",
                "Oxidation of ammonia to nitrite (NH3 to NO2-)",
                "Oxidation of ascorbic acid (C6H8O6 to C6H6O6)",
                "Oxidation of cholesterol to bile acids (C27H46O)",
                "Oxidation of copper (Cu to Cu2+)",
                "Oxidation of ethanol to acetaldehyde (C2H5OH)",
                "Oxidation of fatty acids in beta-oxidation (C16H32O2)",
                "Oxidation of ferrous ions to ferric ions (Fe2+ to Fe3+)",
                "Oxidation of glucose (C6H12O6 to CO2)",
                "Oxidation of glucose to gluconic acid (C6H12O6 to C6H12O7)",
                "Oxidation of glucose-6-phosphate to 6-phosphogluconate (C6H13O9P)",
                "Oxidation of hydrogen gas to protons (H2 to 2H+)",
                "Oxidation of hydrogen sulfide to sulfur (H2S to S)",
                "Oxidation of iron (Fe to Fe2+)",
                "Oxidation of lactate to pyruvate (C3H6O3 to C3H4O3)",
                "Oxidation of magnesium (Mg to Mg2+)",
                "Oxidation of phenol to quinone (C6H5OH to C6H4O2)",
                "Oxidation of pyruvate to acetyl-CoA (C3H4O3 to C2H3O-CoA)",
                "Oxidation of silver (Ag to Ag+)",
                "Oxidation of sodium thiosulfate to sulfate (Na2S2O3 to Na2SO4)",
                "Oxidation of sulfur dioxide to sulfur trioxide (SO2 to SO3)",
                "Respiration in aerobic organisms (C6H12O6)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Combustion Reaction (CR)",
            "Respiration (R)",
            "Electron Transport Chain (ETC)",
            "Oxidation of Glucose (OG)",
            "Oxidation of Hydrogen Peroxide (OHP)",
            "Rusting of Iron (RI)",
            "Corrosion (C)",
            "Bleaching (B)",
            "Oxidation of Sodium (OS)",
            "Oxidation of Hydrogen (OH)",
            "Oxidation of Magnesium (OM)",
            "Oxidation of Sulfur (OSu)",
            "Oxidation of Nitrogen (ON)",
            "Oxidation of Carbon (OC)",
            "Oxidation of Phosphorus (OP)",
            "Oxidation of Chlorine (OCl)",
            "Oxidation of Potassium (OPo)",
            "Oxidation of Calcium (OCa)",
            "Oxidation of Zinc (OZ)",
            "Oxidation of Copper (OCu)",
            "Oxidation of Aluminum (OA)",
            "Oxidation of Silver (OSi)",
            "Oxidation of Gold (OG)",
            "Oxidation of Platinum (OPt)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Combustion Reaction (CR)",
                "Respiration (R)",
                "Electron Transport Chain (ETC)",
                "Oxidation of Glucose (OG)",
                "Oxidation of Hydrogen Peroxide (OHP)",
                "Rusting of Iron (RI)",
                "Corrosion (C)",
                "Bleaching (B)",
                "Oxidation of Sodium (OS)",
                "Oxidation of Hydrogen (OH)",
                "Oxidation of Magnesium (OM)",
                "Oxidation of Sulfur (OSu)",
                "Oxidation of Nitrogen (ON)",
                "Oxidation of Carbon (OC)",
                "Oxidation of Phosphorus (OP)",
                "Oxidation of Chlorine (OCl)",
                "Oxidation of Potassium (OPo)",
                "Oxidation of Calcium (OCa)",
                "Oxidation of Zinc (OZ)",
                "Oxidation of Copper (OCu)",
                "Oxidation of Aluminum (OA)",
                "Oxidation of Silver (OSi)",
                "Oxidation of Gold (OG)",
                "Oxidation of Platinum (OPt)"
            ],
            "mismatches": [],
            "true_referents": [
                "Bleaching (B)",
                "Combustion Reaction (CR)",
                "Corrosion (C)",
                "Electron Transport Chain (ETC)",
                "Oxidation of Aluminum (OA)",
                "Oxidation of Calcium (OCa)",
                "Oxidation of Carbon (OC)",
                "Oxidation of Chlorine (OCl)",
                "Oxidation of Copper (OCu)",
                "Oxidation of Glucose (OG)",
                "Oxidation of Gold (OG)",
                "Oxidation of Hydrogen (OH)",
                "Oxidation of Hydrogen Peroxide (OHP)",
                "Oxidation of Magnesium (OM)",
                "Oxidation of Nitrogen (ON)",
                "Oxidation of Phosphorus (OP)",
                "Oxidation of Platinum (OPt)",
                "Oxidation of Potassium (OPo)",
                "Oxidation of Silver (OSi)",
                "Oxidation of Sodium (OS)",
                "Oxidation of Sulfur (OSu)",
                "Oxidation of Zinc (OZ)",
                "Respiration (R)",
                "Rusting of Iron (RI)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Oxidation of glucose in cellular respiration (GLU-OX)",
            "Oxidation of fatty acids in beta-oxidation (FA-OX)",
            "Oxidation of ethanol in alcoholic fermentation (ETH-OX)",
            "Oxidation of pyruvate in the citric acid cycle (PYR-OX)",
            "Oxidation of NADH in the electron transport chain (NADH-OX)",
            "Oxidation of DNA bases by reactive oxygen species (DNA-OX)",
            "Oxidation of lipids in lipid peroxidation (LIP-OX)",
            "Oxidation of amino acids in protein catabolism (AA-OX)",
            "Oxidation of iron in the rusting process (FE-OX)",
            "Oxidation of hydrogen peroxide by catalase (H2O2-OX)",
            "Oxidation of ascorbic acid in the presence of oxygen (VITC-OX)",
            "Oxidation of dopamine in the brain (DA-OX)",
            "Oxidation of cholesterol in the formation of plaque (CHOL-OX)",
            "Oxidation of ethanol in the liver (ETH-LIV-OX)",
            "Oxidation of glucose in glycolysis (GLU-GLY-OX)",
            "Oxidation of fatty acids in lipolysis (FA-LIP-OX)",
            "Oxidation of acetate in the tricarboxylic acid cycle (ACET-OX)",
            "Oxidation of NADPH in the pentose phosphate pathway (NADPH-OX)",
            "Oxidation of purines in purine catabolism (PUR-OX)",
            "Oxidation of heme in the breakdown of red blood cells (HEME-OX)",
            "Oxidation of methanol in the liver (MET-LIV-OX)",
            "Oxidation of glucose in gluconeogenesis (GLU-GLN-OX)",
            "Oxidation of fatty acids in adipose tissue (FA-ADI-OX)",
            "Oxidation of ethanol in the brain (ETH-BRAIN-OX)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Oxidation of glucose in cellular respiration (GLU-OX)",
                "Oxidation of fatty acids in beta-oxidation (FA-OX)",
                "Oxidation of ethanol in alcoholic fermentation (ETH-OX)",
                "Oxidation of pyruvate in the citric acid cycle (PYR-OX)",
                "Oxidation of NADH in the electron transport chain (NADH-OX)",
                "Oxidation of DNA bases by reactive oxygen species (DNA-OX)",
                "Oxidation of lipids in lipid peroxidation (LIP-OX)",
                "Oxidation of amino acids in protein catabolism (AA-OX)",
                "Oxidation of iron in the rusting process (FE-OX)",
                "Oxidation of hydrogen peroxide by catalase (H2O2-OX)",
                "Oxidation of ascorbic acid in the presence of oxygen (VITC-OX)",
                "Oxidation of dopamine in the brain (DA-OX)",
                "Oxidation of cholesterol in the formation of plaque (CHOL-OX)",
                "Oxidation of ethanol in the liver (ETH-LIV-OX)",
                "Oxidation of glucose in glycolysis (GLU-GLY-OX)",
                "Oxidation of fatty acids in lipolysis (FA-LIP-OX)",
                "Oxidation of acetate in the tricarboxylic acid cycle (ACET-OX)",
                "Oxidation of NADPH in the pentose phosphate pathway (NADPH-OX)",
                "Oxidation of purines in purine catabolism (PUR-OX)",
                "Oxidation of heme in the breakdown of red blood cells (HEME-OX)",
                "Oxidation of methanol in the liver (MET-LIV-OX)",
                "Oxidation of glucose in gluconeogenesis (GLU-GLN-OX)",
                "Oxidation of fatty acids in adipose tissue (FA-ADI-OX)",
                "Oxidation of ethanol in the brain (ETH-BRAIN-OX)"
            ],
            "mismatches": [],
            "true_referents": [
                "Oxidation of DNA bases by reactive oxygen species (DNA-OX)",
                "Oxidation of NADH in the electron transport chain (NADH-OX)",
                "Oxidation of NADPH in the pentose phosphate pathway (NADPH-OX)",
                "Oxidation of acetate in the tricarboxylic acid cycle (ACET-OX)",
                "Oxidation of amino acids in protein catabolism (AA-OX)",
                "Oxidation of ascorbic acid in the presence of oxygen (VITC-OX)",
                "Oxidation of cholesterol in the formation of plaque (CHOL-OX)",
                "Oxidation of dopamine in the brain (DA-OX)",
                "Oxidation of ethanol in alcoholic fermentation (ETH-OX)",
                "Oxidation of ethanol in the brain (ETH-BRAIN-OX)",
                "Oxidation of ethanol in the liver (ETH-LIV-OX)",
                "Oxidation of fatty acids in adipose tissue (FA-ADI-OX)",
                "Oxidation of fatty acids in beta-oxidation (FA-OX)",
                "Oxidation of fatty acids in lipolysis (FA-LIP-OX)",
                "Oxidation of glucose in cellular respiration (GLU-OX)",
                "Oxidation of glucose in gluconeogenesis (GLU-GLN-OX)",
                "Oxidation of glucose in glycolysis (GLU-GLY-OX)",
                "Oxidation of heme in the breakdown of red blood cells (HEME-OX)",
                "Oxidation of hydrogen peroxide by catalase (H2O2-OX)",
                "Oxidation of iron in the rusting process (FE-OX)",
                "Oxidation of lipids in lipid peroxidation (LIP-OX)",
                "Oxidation of methanol in the liver (MET-LIV-OX)",
                "Oxidation of purines in purine catabolism (PUR-OX)",
                "Oxidation of pyruvate in the citric acid cycle (PYR-OX)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Methane Combustion (CH\u2084 + 2 O\u2082 \u2192 CO\u2082 + 2 H\u2082O)",
            "Rusting of Iron (4 Fe + 3 O\u2082 \u2192 2 Fe\u2082O\u2083)",
            "Ethanol Oxidation to Acetaldehyde (CH\u2083CH\u2082OH + [O] \u2192 CH\u2083CHO + H\u2082O)",
            "Ethanol Oxidation to Acetic Acid (CH\u2083CH\u2082OH + 2 [O] \u2192 CH\u2083COOH + H\u2082O)",
            "Benzaldehyde Oxidation to Benzoic Acid (C\u2086H\u2085CHO + [O] \u2192 C\u2086H\u2085COOH)",
            "Cyclohexanol Oxidation to Cyclohexanone (C\u2086H\u2081\u2081OH \u2192 C\u2086H\u2081\u2080O + H\u2082O)",
            "Isopropanol Oxidation to Acetone (CH\u2083CH(OH)CH\u2083 \u2192 CH\u2083COCH\u2083 + H\u2082O)",
            "Methanol Oxidation to Formaldehyde (CH\u2083OH + [O] \u2192 H\u2082CO + H\u2082O)",
            "Formaldehyde Oxidation to Formic Acid (H\u2082CO + [O] \u2192 HCOOH)",
            "Propylene Oxidation to Propionaldehyde (CH\u2083CH=CH\u2082 + [O] \u2192 CH\u2083CH\u2082CHO)",
            "Sulfide Oxidation to Sulfoxide (R-S-R' + [O] \u2192 R-S(O)-R')",
            "Sulfite Oxidation to Sulfate (SO\u2083\u00b2\u207b + [O] \u2192 SO\u2084\u00b2\u207b)",
            "Glucose Oxidation to Gluconic Acid (C\u2086H\u2081\u2082O\u2086 + [O] \u2192 C\u2086H\u2081\u2082O\u2087)",
            "Glycerol Oxidation to Dihydroxyacetone (C\u2083H\u2088O\u2083 + [O] \u2192 C\u2083H\u2086O\u2083 + H\u2082O)",
            "Toluene Oxidation to Benzaldehyde (C\u2086H\u2085CH\u2083 + [O] \u2192 C\u2086H\u2085CHO + H\u2082O)",
            "Toluene Oxidation to Benzoic Acid (C\u2086H\u2085CH\u2083 + 2 [O] \u2192 C\u2086H\u2085COOH + H\u2082O)",
            "p-Xylene Oxidation to Terephthalic Acid (C\u2088H\u2081\u2080 + 3 [O] \u2192 C\u2088H\u2086O\u2084 + H\u2082O)",
            "Styrene Oxidation to Benzaldehyde (C\u2088H\u2088 + [O] \u2192 C\u2087H\u2086CHO + H\u2082O)",
            "Lactic Acid Oxidation to Pyruvic Acid (C\u2083H\u2086O\u2083 + [O] \u2192 C\u2083H\u2084O\u2083 + H\u2082O)",
            "Catechol Oxidation to o-Quinone (C\u2086H\u2084(OH)\u2082 + [O] \u2192 C\u2086H\u2084O\u2082 + H\u2082O)",
            "Mannitol Oxidation to Mannonic Acid (C\u2086H\u2081\u2084O\u2086 + [O] \u2192 C\u2086H\u2081\u2084O\u2087)",
            "Aniline Oxidation to Nitrosobenzene (C\u2086H\u2085NH\u2082 + [O] \u2192 C\u2086H\u2085NHO)",
            "Benzyl Alcohol Oxidation to Benzaldehyde (C\u2086H\u2085CH\u2082OH + [O] \u2192 C\u2086H\u2085CHO + H\u2082O)",
            "p-Anisidine Oxidation to p-Nitroanisole (C\u2086H\u2085NHCH\u2083 + [O] \u2192 C\u2086H\u2085NOCH\u2083 + H\u2082O)",
            "Dimethyl Sulfoxide Oxidation to Dimethyl Sulfone (CH\u2083)\u2082SO + [O] \u2192 (CH\u2083)\u2082SO\u2082"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane Combustion (CH\u2084 + 2 O\u2082 \u2192 CO\u2082 + 2 H\u2082O)",
                "Rusting of Iron (4 Fe + 3 O\u2082 \u2192 2 Fe\u2082O\u2083)",
                "Ethanol Oxidation to Acetaldehyde (CH\u2083CH\u2082OH + [O] \u2192 CH\u2083CHO + H\u2082O)",
                "Ethanol Oxidation to Acetic Acid (CH\u2083CH\u2082OH + 2 [O] \u2192 CH\u2083COOH + H\u2082O)",
                "Benzaldehyde Oxidation to Benzoic Acid (C\u2086H\u2085CHO + [O] \u2192 C\u2086H\u2085COOH)",
                "Cyclohexanol Oxidation to Cyclohexanone (C\u2086H\u2081\u2081OH \u2192 C\u2086H\u2081\u2080O + H\u2082O)",
                "Isopropanol Oxidation to Acetone (CH\u2083CH(OH)CH\u2083 \u2192 CH\u2083COCH\u2083 + H\u2082O)",
                "Methanol Oxidation to Formaldehyde (CH\u2083OH + [O] \u2192 H\u2082CO + H\u2082O)",
                "Formaldehyde Oxidation to Formic Acid (H\u2082CO + [O] \u2192 HCOOH)",
                "Propylene Oxidation to Propionaldehyde (CH\u2083CH=CH\u2082 + [O] \u2192 CH\u2083CH\u2082CHO)",
                "Sulfide Oxidation to Sulfoxide (R-S-R' + [O] \u2192 R-S(O)-R')",
                "Sulfite Oxidation to Sulfate (SO\u2083\u00b2\u207b + [O] \u2192 SO\u2084\u00b2\u207b)",
                "Glucose Oxidation to Gluconic Acid (C\u2086H\u2081\u2082O\u2086 + [O] \u2192 C\u2086H\u2081\u2082O\u2087)",
                "Glycerol Oxidation to Dihydroxyacetone (C\u2083H\u2088O\u2083 + [O] \u2192 C\u2083H\u2086O\u2083 + H\u2082O)",
                "Toluene Oxidation to Benzaldehyde (C\u2086H\u2085CH\u2083 + [O] \u2192 C\u2086H\u2085CHO + H\u2082O)",
                "Toluene Oxidation to Benzoic Acid (C\u2086H\u2085CH\u2083 + 2 [O] \u2192 C\u2086H\u2085COOH + H\u2082O)",
                "p-Xylene Oxidation to Terephthalic Acid (C\u2088H\u2081\u2080 + 3 [O] \u2192 C\u2088H\u2086O\u2084 + H\u2082O)",
                "Styrene Oxidation to Benzaldehyde (C\u2088H\u2088 + [O] \u2192 C\u2087H\u2086CHO + H\u2082O)",
                "Lactic Acid Oxidation to Pyruvic Acid (C\u2083H\u2086O\u2083 + [O] \u2192 C\u2083H\u2084O\u2083 + H\u2082O)",
                "Catechol Oxidation to o-Quinone (C\u2086H\u2084(OH)\u2082 + [O] \u2192 C\u2086H\u2084O\u2082 + H\u2082O)",
                "Mannitol Oxidation to Mannonic Acid (C\u2086H\u2081\u2084O\u2086 + [O] \u2192 C\u2086H\u2081\u2084O\u2087)",
                "Aniline Oxidation to Nitrosobenzene (C\u2086H\u2085NH\u2082 + [O] \u2192 C\u2086H\u2085NHO)",
                "Benzyl Alcohol Oxidation to Benzaldehyde (C\u2086H\u2085CH\u2082OH + [O] \u2192 C\u2086H\u2085CHO + H\u2082O)",
                "p-Anisidine Oxidation to p-Nitroanisole (C\u2086H\u2085NHCH\u2083 + [O] \u2192 C\u2086H\u2085NOCH\u2083 + H\u2082O)"
            ],
            "mismatches": [
                "Dimethyl Sulfoxide Oxidation to Dimethyl Sulfone (CH\u2083)\u2082SO + [O] \u2192 (CH\u2083)\u2082SO\u2082"
            ],
            "true_referents": [
                "Aniline Oxidation to Nitrosobenzene (C\u2086H\u2085NH\u2082 + [O] \u2192 C\u2086H\u2085NHO)",
                "Benzaldehyde Oxidation to Benzoic Acid (C\u2086H\u2085CHO + [O] \u2192 C\u2086H\u2085COOH)",
                "Benzyl Alcohol Oxidation to Benzaldehyde (C\u2086H\u2085CH\u2082OH + [O] \u2192 C\u2086H\u2085CHO + H\u2082O)",
                "Catechol Oxidation to o-Quinone (C\u2086H\u2084(OH)\u2082 + [O] \u2192 C\u2086H\u2084O\u2082 + H\u2082O)",
                "Cyclohexanol Oxidation to Cyclohexanone (C\u2086H\u2081\u2081OH \u2192 C\u2086H\u2081\u2080O + H\u2082O)",
                "Ethanol Oxidation to Acetaldehyde (CH\u2083CH\u2082OH + [O] \u2192 CH\u2083CHO + H\u2082O)",
                "Ethanol Oxidation to Acetic Acid (CH\u2083CH\u2082OH + 2 [O] \u2192 CH\u2083COOH + H\u2082O)",
                "Formaldehyde Oxidation to Formic Acid (H\u2082CO + [O] \u2192 HCOOH)",
                "Glucose Oxidation to Gluconic Acid (C\u2086H\u2081\u2082O\u2086 + [O] \u2192 C\u2086H\u2081\u2082O\u2087)",
                "Glycerol Oxidation to Dihydroxyacetone (C\u2083H\u2088O\u2083 + [O] \u2192 C\u2083H\u2086O\u2083 + H\u2082O)",
                "Isopropanol Oxidation to Acetone (CH\u2083CH(OH)CH\u2083 \u2192 CH\u2083COCH\u2083 + H\u2082O)",
                "Lactic Acid Oxidation to Pyruvic Acid (C\u2083H\u2086O\u2083 + [O] \u2192 C\u2083H\u2084O\u2083 + H\u2082O)",
                "Mannitol Oxidation to Mannonic Acid (C\u2086H\u2081\u2084O\u2086 + [O] \u2192 C\u2086H\u2081\u2084O\u2087)",
                "Methane Combustion (CH\u2084 + 2 O\u2082 \u2192 CO\u2082 + 2 H\u2082O)",
                "Methanol Oxidation to Formaldehyde (CH\u2083OH + [O] \u2192 H\u2082CO + H\u2082O)",
                "Propylene Oxidation to Propionaldehyde (CH\u2083CH=CH\u2082 + [O] \u2192 CH\u2083CH\u2082CHO)",
                "Rusting of Iron (4 Fe + 3 O\u2082 \u2192 2 Fe\u2082O\u2083)",
                "Styrene Oxidation to Benzaldehyde (C\u2088H\u2088 + [O] \u2192 C\u2087H\u2086CHO + H\u2082O)",
                "Sulfide Oxidation to Sulfoxide (R-S-R' + [O] \u2192 R-S(O)-R')",
                "Sulfite Oxidation to Sulfate (SO\u2083\u00b2\u207b + [O] \u2192 SO\u2084\u00b2\u207b)",
                "Toluene Oxidation to Benzaldehyde (C\u2086H\u2085CH\u2083 + [O] \u2192 C\u2086H\u2085CHO + H\u2082O)",
                "Toluene Oxidation to Benzoic Acid (C\u2086H\u2085CH\u2083 + 2 [O] \u2192 C\u2086H\u2085COOH + H\u2082O)",
                "p-Anisidine Oxidation to p-Nitroanisole (C\u2086H\u2085NHCH\u2083 + [O] \u2192 C\u2086H\u2085NOCH\u2083 + H\u2082O)",
                "p-Xylene Oxidation to Terephthalic Acid (C\u2088H\u2081\u2080 + 3 [O] \u2192 C\u2088H\u2086O\u2084 + H\u2082O)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Oxidation of iron to form rust (Fe \u2192 Fe2+ + 2e-)",
            "Combustion of methane (CH4 + 2O2 \u2192 CO2 + 2H2O)",
            "Oxidation of glucose in cellular respiration (C6H12O6 + 6O2 \u2192 6CO2 + 6H2O)",
            "Oxidation of ethanol by alcohol dehydrogenase (CH3CH2OH \u2192 CH3CHO + 2H+ + 2e-)",
            "Oxidation of sulfite to sulfate (SO32- \u2192 SO42- + 2e-)",
            "Oxidation of hydrogen peroxide by catalase (H2O2 \u2192 O2 + 2H+ + 2e-)",
            "Oxidation of NADH to NAD+ (NADH \u2192 NAD+ + H+ + 2e-)",
            "Oxidation of ascorbic acid (vitamin C) to dehydroascorbic acid",
            "Oxidation of dopamine by monoamine oxidase (MAO)",
            "Oxidation of adrenaline by catechol-O-methyltransferase (COMT)",
            "Oxidation of nitric oxide to nitrogen dioxide (2NO + O2 \u2192 2NO2)",
            "Oxidation of sulfur dioxide to sulfur trioxide (2SO2 + O2 \u2192 2SO3)",
            "Oxidation of ammonia to nitric acid (NH3 + 2O2 \u2192 HNO3 + H2O)",
            "Oxidation of carbon monoxide to carbon dioxide (2CO + O2 \u2192 2CO2)",
            "Oxidation of hydrogen sulfide to sulfur dioxide (2H2S + 3O2 \u2192 2SO2 + 2H2O)",
            "Oxidation of methanol to formaldehyde (CH3OH \u2192 CH2O + 2H+ + 2e-)",
            "Oxidation of benzaldehyde to benzoic acid (C6H5CHO + O2 \u2192 C6H5COOH)",
            "Oxidation of copper to copper(II) oxide (2Cu + O2 \u2192 2CuO)",
            "Oxidation of zinc in a galvanic cell (Zn \u2192 Zn2+ + 2e-)",
            "Oxidation of hydrogen gas to protons (H2 \u2192 2H+ + 2e-)",
            "Oxidation of iodide to iodine (2I- \u2192 I2 + 2e-)",
            "Oxidation of oxalate to carbon dioxide (C2O42- \u2192 2CO2 + 2e-)",
            "Oxidation of formate to carbon dioxide (HCOO- \u2192 CO2 + H+ + 2e-)",
            "Oxidation of nitrite to nitrate (NO2- + H2O \u2192 NO3- + 2H+ + 2e-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Oxidation of iron to form rust (Fe \u2192 Fe2+ + 2e-)",
                "Combustion of methane (CH4 + 2O2 \u2192 CO2 + 2H2O)",
                "Oxidation of glucose in cellular respiration (C6H12O6 + 6O2 \u2192 6CO2 + 6H2O)",
                "Oxidation of ethanol by alcohol dehydrogenase (CH3CH2OH \u2192 CH3CHO + 2H+ + 2e-)",
                "Oxidation of sulfite to sulfate (SO32- \u2192 SO42- + 2e-)",
                "Oxidation of hydrogen peroxide by catalase (H2O2 \u2192 O2 + 2H+ + 2e-)",
                "Oxidation of NADH to NAD+ (NADH \u2192 NAD+ + H+ + 2e-)",
                "Oxidation of ascorbic acid (vitamin C) to dehydroascorbic acid",
                "Oxidation of dopamine by monoamine oxidase (MAO)",
                "Oxidation of adrenaline by catechol-O-methyltransferase (COMT)",
                "Oxidation of nitric oxide to nitrogen dioxide (2NO + O2 \u2192 2NO2)",
                "Oxidation of sulfur dioxide to sulfur trioxide (2SO2 + O2 \u2192 2SO3)",
                "Oxidation of ammonia to nitric acid (NH3 + 2O2 \u2192 HNO3 + H2O)",
                "Oxidation of carbon monoxide to carbon dioxide (2CO + O2 \u2192 2CO2)",
                "Oxidation of hydrogen sulfide to sulfur dioxide (2H2S + 3O2 \u2192 2SO2 + 2H2O)",
                "Oxidation of methanol to formaldehyde (CH3OH \u2192 CH2O + 2H+ + 2e-)",
                "Oxidation of benzaldehyde to benzoic acid (C6H5CHO + O2 \u2192 C6H5COOH)",
                "Oxidation of copper to copper(II) oxide (2Cu + O2 \u2192 2CuO)",
                "Oxidation of zinc in a galvanic cell (Zn \u2192 Zn2+ + 2e-)",
                "Oxidation of hydrogen gas to protons (H2 \u2192 2H+ + 2e-)",
                "Oxidation of iodide to iodine (2I- \u2192 I2 + 2e-)",
                "Oxidation of oxalate to carbon dioxide (C2O42- \u2192 2CO2 + 2e-)",
                "Oxidation of formate to carbon dioxide (HCOO- \u2192 CO2 + H+ + 2e-)",
                "Oxidation of nitrite to nitrate (NO2- + H2O \u2192 NO3- + 2H+ + 2e-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Combustion of methane (CH4 + 2O2 \u2192 CO2 + 2H2O)",
                "Oxidation of NADH to NAD+ (NADH \u2192 NAD+ + H+ + 2e-)",
                "Oxidation of adrenaline by catechol-O-methyltransferase (COMT)",
                "Oxidation of ammonia to nitric acid (NH3 + 2O2 \u2192 HNO3 + H2O)",
                "Oxidation of ascorbic acid (vitamin C) to dehydroascorbic acid",
                "Oxidation of benzaldehyde to benzoic acid (C6H5CHO + O2 \u2192 C6H5COOH)",
                "Oxidation of carbon monoxide to carbon dioxide (2CO + O2 \u2192 2CO2)",
                "Oxidation of copper to copper(II) oxide (2Cu + O2 \u2192 2CuO)",
                "Oxidation of dopamine by monoamine oxidase (MAO)",
                "Oxidation of ethanol by alcohol dehydrogenase (CH3CH2OH \u2192 CH3CHO + 2H+ + 2e-)",
                "Oxidation of formate to carbon dioxide (HCOO- \u2192 CO2 + H+ + 2e-)",
                "Oxidation of glucose in cellular respiration (C6H12O6 + 6O2 \u2192 6CO2 + 6H2O)",
                "Oxidation of hydrogen gas to protons (H2 \u2192 2H+ + 2e-)",
                "Oxidation of hydrogen peroxide by catalase (H2O2 \u2192 O2 + 2H+ + 2e-)",
                "Oxidation of hydrogen sulfide to sulfur dioxide (2H2S + 3O2 \u2192 2SO2 + 2H2O)",
                "Oxidation of iodide to iodine (2I- \u2192 I2 + 2e-)",
                "Oxidation of iron to form rust (Fe \u2192 Fe2+ + 2e-)",
                "Oxidation of methanol to formaldehyde (CH3OH \u2192 CH2O + 2H+ + 2e-)",
                "Oxidation of nitric oxide to nitrogen dioxide (2NO + O2 \u2192 2NO2)",
                "Oxidation of nitrite to nitrate (NO2- + H2O \u2192 NO3- + 2H+ + 2e-)",
                "Oxidation of oxalate to carbon dioxide (C2O42- \u2192 2CO2 + 2e-)",
                "Oxidation of sulfite to sulfate (SO32- \u2192 SO42- + 2e-)",
                "Oxidation of sulfur dioxide to sulfur trioxide (2SO2 + O2 \u2192 2SO3)",
                "Oxidation of zinc in a galvanic cell (Zn \u2192 Zn2+ + 2e-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Combustion",
            "Rusting of iron (Fe)",
            "Browning of avocados",
            "Tarnishing of silver (Ag)",
            "Bleaching of hair",
            "Oxidation of ethanol to acetaldehyde",
            "Conversion of methane (CH4) to carbon dioxide (CO2)",
            "Oxidation of glucose in cellular respiration",
            "Conversion of ammonia (NH3) to nitric oxide (NO)",
            "Oxidation of sulfur dioxide (SO2) to sulfur trioxide (SO3)",
            "Oxidation of hydrogen sulfide (H2S) to sulfur (S)",
            "Conversion of primary alcohols to aldehydes",
            "Conversion of secondary alcohols to ketones",
            "Oxidation of hydroquinone to benzoquinone",
            "Conversion of catechol to ortho-benzoquinone",
            "Oxidation of ascorbic acid (vitamin C)",
            "Conversion of ferrous ion (Fe2+) to ferric ion (Fe3+)",
            "Oxidation of iodide ion (I-) to iodine (I2)",
            "Conversion of nitric oxide (NO) to nitrogen dioxide (NO2)",
            "Oxidation of carbon monoxide (CO) to carbon dioxide (CO2)",
            "Conversion of aniline to nitrobenzene",
            "Oxidation of phenol to catechol or hydroquinone",
            "Conversion of sulfite ion (SO32-) to sulfate ion (SO42-)",
            "Oxidation of thiosulfate ion (S2O32-) to tetrathionate ion (S4O62-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Combustion",
                "Rusting of iron (Fe)",
                "Browning of avocados",
                "Tarnishing of silver (Ag)",
                "Bleaching of hair",
                "Oxidation of ethanol to acetaldehyde",
                "Conversion of methane (CH4) to carbon dioxide (CO2)",
                "Oxidation of glucose in cellular respiration",
                "Conversion of ammonia (NH3) to nitric oxide (NO)",
                "Oxidation of sulfur dioxide (SO2) to sulfur trioxide (SO3)",
                "Oxidation of hydrogen sulfide (H2S) to sulfur (S)",
                "Conversion of primary alcohols to aldehydes",
                "Conversion of secondary alcohols to ketones",
                "Oxidation of hydroquinone to benzoquinone",
                "Conversion of catechol to ortho-benzoquinone",
                "Oxidation of ascorbic acid (vitamin C)",
                "Conversion of ferrous ion (Fe2+) to ferric ion (Fe3+)",
                "Oxidation of iodide ion (I-) to iodine (I2)",
                "Conversion of nitric oxide (NO) to nitrogen dioxide (NO2)",
                "Oxidation of carbon monoxide (CO) to carbon dioxide (CO2)",
                "Conversion of aniline to nitrobenzene",
                "Oxidation of phenol to catechol or hydroquinone",
                "Conversion of sulfite ion (SO32-) to sulfate ion (SO42-)",
                "Oxidation of thiosulfate ion (S2O32-) to tetrathionate ion (S4O62-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Bleaching of hair",
                "Browning of avocados",
                "Combustion",
                "Conversion of ammonia (NH3) to nitric oxide (NO)",
                "Conversion of aniline to nitrobenzene",
                "Conversion of catechol to ortho-benzoquinone",
                "Conversion of ferrous ion (Fe2+) to ferric ion (Fe3+)",
                "Conversion of methane (CH4) to carbon dioxide (CO2)",
                "Conversion of nitric oxide (NO) to nitrogen dioxide (NO2)",
                "Conversion of primary alcohols to aldehydes",
                "Conversion of secondary alcohols to ketones",
                "Conversion of sulfite ion (SO32-) to sulfate ion (SO42-)",
                "Oxidation of ascorbic acid (vitamin C)",
                "Oxidation of carbon monoxide (CO) to carbon dioxide (CO2)",
                "Oxidation of ethanol to acetaldehyde",
                "Oxidation of glucose in cellular respiration",
                "Oxidation of hydrogen sulfide (H2S) to sulfur (S)",
                "Oxidation of hydroquinone to benzoquinone",
                "Oxidation of iodide ion (I-) to iodine (I2)",
                "Oxidation of phenol to catechol or hydroquinone",
                "Oxidation of sulfur dioxide (SO2) to sulfur trioxide (SO3)",
                "Oxidation of thiosulfate ion (S2O32-) to tetrathionate ion (S4O62-)",
                "Rusting of iron (Fe)",
                "Tarnishing of silver (Ag)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Oxidation of iron (Fe) to iron oxide (Fe2O3)",
            "Combustion of methane (CH4)",
            "Oxidation of ethanol (C2H5OH) to ethanal (CH3CHO)",
            "Oxidation of glucose (C6H12O6) in cellular respiration",
            "Corrosion of metals",
            "Photosynthesis (light-dependent reactions)",
            "Oxidation of ammonia (NH3) to nitric acid (HNO3)",
            "Rusting of iron",
            "Oxidation of sulfur dioxide (SO2) to sulfur trioxide (SO3)",
            "Oxidation of hydrogen sulfide (H2S) to sulfur",
            "Oxidation of carbon monoxide (CO) to carbon dioxide (CO2)",
            "Oxidation of alcohols to aldehydes or ketones",
            "Oxidation of alkenes to alcohols",
            "Oxidation of primary alcohols to carboxylic acids",
            "Oxidation of secondary alcohols to ketones",
            "Oxidation of aldehydes to carboxylic acids",
            "Oxidation of phenols to quinones",
            "Oxidation of amines to nitroso compounds",
            "Oxidation of thiols to disulfides",
            "Oxidation of sulfites to sulfates",
            "Oxidation of ferrous iron (Fe2+) to ferric iron (Fe3+)",
            "Oxidation of cuprous copper (Cu+) to cupric copper (Cu2+)",
            "Oxidation of stannous tin (Sn2+) to stannic tin (Sn4+)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Oxidation of iron (Fe) to iron oxide (Fe2O3)",
                "Combustion of methane (CH4)",
                "Oxidation of ethanol (C2H5OH) to ethanal (CH3CHO)",
                "Oxidation of glucose (C6H12O6) in cellular respiration",
                "Corrosion of metals",
                "Photosynthesis (light-dependent reactions)",
                "Oxidation of ammonia (NH3) to nitric acid (HNO3)",
                "Rusting of iron",
                "Oxidation of sulfur dioxide (SO2) to sulfur trioxide (SO3)",
                "Oxidation of hydrogen sulfide (H2S) to sulfur",
                "Oxidation of carbon monoxide (CO) to carbon dioxide (CO2)",
                "Oxidation of alcohols to aldehydes or ketones",
                "Oxidation of alkenes to alcohols",
                "Oxidation of primary alcohols to carboxylic acids",
                "Oxidation of secondary alcohols to ketones",
                "Oxidation of aldehydes to carboxylic acids",
                "Oxidation of phenols to quinones",
                "Oxidation of amines to nitroso compounds",
                "Oxidation of thiols to disulfides",
                "Oxidation of sulfites to sulfates",
                "Oxidation of ferrous iron (Fe2+) to ferric iron (Fe3+)",
                "Oxidation of cuprous copper (Cu+) to cupric copper (Cu2+)",
                "Oxidation of stannous tin (Sn2+) to stannic tin (Sn4+)"
            ],
            "mismatches": [],
            "true_referents": [
                "Combustion of methane (CH4)",
                "Corrosion of metals",
                "Oxidation of alcohols to aldehydes or ketones",
                "Oxidation of aldehydes to carboxylic acids",
                "Oxidation of alkenes to alcohols",
                "Oxidation of amines to nitroso compounds",
                "Oxidation of ammonia (NH3) to nitric acid (HNO3)",
                "Oxidation of carbon monoxide (CO) to carbon dioxide (CO2)",
                "Oxidation of cuprous copper (Cu+) to cupric copper (Cu2+)",
                "Oxidation of ethanol (C2H5OH) to ethanal (CH3CHO)",
                "Oxidation of ferrous iron (Fe2+) to ferric iron (Fe3+)",
                "Oxidation of glucose (C6H12O6) in cellular respiration",
                "Oxidation of hydrogen sulfide (H2S) to sulfur",
                "Oxidation of iron (Fe) to iron oxide (Fe2O3)",
                "Oxidation of phenols to quinones",
                "Oxidation of primary alcohols to carboxylic acids",
                "Oxidation of secondary alcohols to ketones",
                "Oxidation of stannous tin (Sn2+) to stannic tin (Sn4+)",
                "Oxidation of sulfites to sulfates",
                "Oxidation of sulfur dioxide (SO2) to sulfur trioxide (SO3)",
                "Oxidation of thiols to disulfides",
                "Photosynthesis (light-dependent reactions)",
                "Rusting of iron"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Oxidation (OX)",
            "Combustion (COM)",
            "Photosynthesis (PHO)",
            "Cellular Respiration (CRS)",
            "Hydrogen Peroxide Decomposition (HPD)",
            "Methane Oxidation (MOX)",
            "Iron Rusting (IRR)",
            "Copper Tarnishing (CUT)",
            "Alcohol Dehydrogenation (ADH)",
            "Cytochrome P450 Catalysis (CPC)",
            "Amine Oxidation (AMO)",
            "Sulfide Oxidation (SOX)",
            "Chlorophyll Oxidation (CHO)",
            "Lipid Peroxidation (LPX)",
            "Hemoglobin Oxidation (HEO)",
            "Glucose Oxidation (GLO)",
            "Ammonia Oxidation (AMX)",
            "Methanol Combustion (MEC)",
            "Ethylene Oxidation (ETO)",
            "Ascorbic Acid Oxidation (AAO)",
            "Catechol Oxidation (CAO)",
            "Xanthine Oxidation (XAO)",
            "Glutathione Oxidation (GLX)",
            "Uric Acid Oxidation (UAO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Oxidation (OX)",
                "Combustion (COM)",
                "Photosynthesis (PHO)",
                "Cellular Respiration (CRS)",
                "Hydrogen Peroxide Decomposition (HPD)",
                "Methane Oxidation (MOX)",
                "Iron Rusting (IRR)",
                "Copper Tarnishing (CUT)",
                "Alcohol Dehydrogenation (ADH)",
                "Cytochrome P450 Catalysis (CPC)",
                "Amine Oxidation (AMO)",
                "Sulfide Oxidation (SOX)",
                "Chlorophyll Oxidation (CHO)",
                "Lipid Peroxidation (LPX)",
                "Hemoglobin Oxidation (HEO)",
                "Glucose Oxidation (GLO)",
                "Ammonia Oxidation (AMX)",
                "Methanol Combustion (MEC)",
                "Ethylene Oxidation (ETO)",
                "Ascorbic Acid Oxidation (AAO)",
                "Catechol Oxidation (CAO)",
                "Xanthine Oxidation (XAO)",
                "Glutathione Oxidation (GLX)",
                "Uric Acid Oxidation (UAO)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alcohol Dehydrogenation (ADH)",
                "Amine Oxidation (AMO)",
                "Ammonia Oxidation (AMX)",
                "Ascorbic Acid Oxidation (AAO)",
                "Catechol Oxidation (CAO)",
                "Cellular Respiration (CRS)",
                "Chlorophyll Oxidation (CHO)",
                "Combustion (COM)",
                "Copper Tarnishing (CUT)",
                "Cytochrome P450 Catalysis (CPC)",
                "Ethylene Oxidation (ETO)",
                "Glucose Oxidation (GLO)",
                "Glutathione Oxidation (GLX)",
                "Hemoglobin Oxidation (HEO)",
                "Hydrogen Peroxide Decomposition (HPD)",
                "Iron Rusting (IRR)",
                "Lipid Peroxidation (LPX)",
                "Methane Oxidation (MOX)",
                "Methanol Combustion (MEC)",
                "Oxidation (OX)",
                "Photosynthesis (PHO)",
                "Sulfide Oxidation (SOX)",
                "Uric Acid Oxidation (UAO)",
                "Xanthine Oxidation (XAO)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Oxidation reaction (Oxidation)",
            "Fenton reaction",
            "Haber-Weiss reaction",
            "Autoxidation",
            "Oxidation of glucose",
            "Oxidation of fatty acids",
            "Oxidation of amino acids",
            "Oxidation of cholesterol",
            "Oxidation of vitamins",
            "Oxidation of antioxidants",
            "Oxidation of DNA",
            "Oxidation of RNA",
            "Oxidation of proteins",
            "Oxidation of lipids",
            "Oxidation of carbohydrates",
            "Oxidation of xenobiotics",
            "Oxidation of pollutants",
            "Oxidation of heavy metals",
            "Oxidation of toxic compounds",
            "Oxidation of carcinogens",
            "Oxidation of mutagens",
            "Oxidation of teratogens",
            "Oxidation of allergens",
            "Oxidation of pro-inflammatory compounds"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Oxidation reaction (Oxidation)",
                "Fenton reaction",
                "Haber-Weiss reaction",
                "Autoxidation",
                "Oxidation of glucose",
                "Oxidation of fatty acids",
                "Oxidation of amino acids",
                "Oxidation of cholesterol",
                "Oxidation of vitamins",
                "Oxidation of antioxidants",
                "Oxidation of DNA",
                "Oxidation of RNA",
                "Oxidation of proteins",
                "Oxidation of lipids",
                "Oxidation of carbohydrates",
                "Oxidation of xenobiotics",
                "Oxidation of pollutants",
                "Oxidation of heavy metals",
                "Oxidation of toxic compounds",
                "Oxidation of carcinogens",
                "Oxidation of mutagens",
                "Oxidation of teratogens",
                "Oxidation of allergens",
                "Oxidation of pro-inflammatory compounds"
            ],
            "mismatches": [],
            "true_referents": [
                "Autoxidation",
                "Fenton reaction",
                "Haber-Weiss reaction",
                "Oxidation of DNA",
                "Oxidation of RNA",
                "Oxidation of allergens",
                "Oxidation of amino acids",
                "Oxidation of antioxidants",
                "Oxidation of carbohydrates",
                "Oxidation of carcinogens",
                "Oxidation of cholesterol",
                "Oxidation of fatty acids",
                "Oxidation of glucose",
                "Oxidation of heavy metals",
                "Oxidation of lipids",
                "Oxidation of mutagens",
                "Oxidation of pollutants",
                "Oxidation of pro-inflammatory compounds",
                "Oxidation of proteins",
                "Oxidation of teratogens",
                "Oxidation of toxic compounds",
                "Oxidation of vitamins",
                "Oxidation of xenobiotics",
                "Oxidation reaction (Oxidation)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": [
            "Oxidation of glucose to gluconic acid (GOX)",
            "Cytochrome P450-catalyzed oxidation of xenobiotics",
            "Fatty acid beta-oxidation (FAO)",
            "Oxidation of lactate to pyruvate (LDH)",
            "Catecholamine oxidation by monoamine oxidase (MAO)",
            "Oxidation of ethanol to acetaldehyde (ADH)",
            "Oxidation of xanthine to uric acid (XO)",
            "Oxidation of ascorbic acid to dehydroascorbic acid (AO)",
            "Oxidation of sulfite to sulfate (SulfO)",
            "Oxidation of nitric oxide to nitrate (NOX)",
            "Oxidation of dopamine to aminochrome (DAO)",
            "Oxidation of tryptophan to kynurenine (TDO)",
            "Oxidation of tyrosine to L-DOPA (TYO)",
            "Oxidation of cysteine to cystine (CDO)",
            "Oxidation of homocysteine to homocystine (HCYTO)",
            "Oxidation of flavin adenine dinucleotide (FAD) to flavin adenine dinucleotide oxidized (FADo)",
            "Oxidation of nicotinamide adenine dinucleotide (NAD) to nicotinamide adenine dinucleotide oxidized (NADo)",
            "Oxidation of nicotinamide adenine dinucleotide phosphate (NADP) to nicotinamide adenine dinucleotide phosphate oxidized (NADPo)",
            "Oxidation of ubiquinol to ubiquinone (CoQ)",
            "Oxidation of plastoquinol to plastoquinone (PQ)",
            "Oxidation of menaquinol to menaquinone (MK)",
            "Oxidation of riboflavin to flavin mononucleotide (RF)",
            "Oxidation of 5,6,7,8-tetrahydrobiopterin to 7,8-dihydrobiopterin (BH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Oxidation of glucose to gluconic acid (GOX)",
                "Cytochrome P450-catalyzed oxidation of xenobiotics",
                "Fatty acid beta-oxidation (FAO)",
                "Oxidation of lactate to pyruvate (LDH)",
                "Catecholamine oxidation by monoamine oxidase (MAO)",
                "Oxidation of ethanol to acetaldehyde (ADH)",
                "Oxidation of xanthine to uric acid (XO)",
                "Oxidation of ascorbic acid to dehydroascorbic acid (AO)",
                "Oxidation of sulfite to sulfate (SulfO)",
                "Oxidation of nitric oxide to nitrate (NOX)",
                "Oxidation of dopamine to aminochrome (DAO)",
                "Oxidation of tryptophan to kynurenine (TDO)",
                "Oxidation of tyrosine to L-DOPA (TYO)",
                "Oxidation of cysteine to cystine (CDO)",
                "Oxidation of homocysteine to homocystine (HCYTO)",
                "Oxidation of flavin adenine dinucleotide (FAD) to flavin adenine dinucleotide oxidized (FADo)",
                "Oxidation of nicotinamide adenine dinucleotide (NAD) to nicotinamide adenine dinucleotide oxidized (NADo)",
                "Oxidation of nicotinamide adenine dinucleotide phosphate (NADP) to nicotinamide adenine dinucleotide phosphate oxidized (NADPo)",
                "Oxidation of ubiquinol to ubiquinone (CoQ)",
                "Oxidation of plastoquinol to plastoquinone (PQ)",
                "Oxidation of menaquinol to menaquinone (MK)",
                "Oxidation of riboflavin to flavin mononucleotide (RF)",
                "Oxidation of 5,6,7,8-tetrahydrobiopterin to 7,8-dihydrobiopterin (BH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Catecholamine oxidation by monoamine oxidase (MAO)",
                "Cytochrome P450-catalyzed oxidation of xenobiotics",
                "Fatty acid beta-oxidation (FAO)",
                "Oxidation of 5,6,7,8-tetrahydrobiopterin to 7,8-dihydrobiopterin (BH2)",
                "Oxidation of ascorbic acid to dehydroascorbic acid (AO)",
                "Oxidation of cysteine to cystine (CDO)",
                "Oxidation of dopamine to aminochrome (DAO)",
                "Oxidation of ethanol to acetaldehyde (ADH)",
                "Oxidation of flavin adenine dinucleotide (FAD) to flavin adenine dinucleotide oxidized (FADo)",
                "Oxidation of glucose to gluconic acid (GOX)",
                "Oxidation of homocysteine to homocystine (HCYTO)",
                "Oxidation of lactate to pyruvate (LDH)",
                "Oxidation of menaquinol to menaquinone (MK)",
                "Oxidation of nicotinamide adenine dinucleotide (NAD) to nicotinamide adenine dinucleotide oxidized (NADo)",
                "Oxidation of nicotinamide adenine dinucleotide phosphate (NADP) to nicotinamide adenine dinucleotide phosphate oxidized (NADPo)",
                "Oxidation of nitric oxide to nitrate (NOX)",
                "Oxidation of plastoquinol to plastoquinone (PQ)",
                "Oxidation of riboflavin to flavin mononucleotide (RF)",
                "Oxidation of sulfite to sulfate (SulfO)",
                "Oxidation of tryptophan to kynurenine (TDO)",
                "Oxidation of tyrosine to L-DOPA (TYO)",
                "Oxidation of ubiquinol to ubiquinone (CoQ)",
                "Oxidation of xanthine to uric acid (XO)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "oxidation reaction",
        "domain": "chemistry",
        "response": "error when calling model 'amazon.titan-text-express-v1': empty response",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]