{
    "@context": {
        "@language": "en",
        "@vocab": "https://schema.org/",
        "citeAs": "cr:citeAs",
        "column": "cr:column",
        "conformsTo": "dct:conformsTo",
        "cr": "http://mlcommons.org/croissant/",
        "data": {
            "@id": "cr:data",
            "@type": "@json"
        },
        "dataType": {
            "@id": "cr:dataType",
            "@type": "@vocab"
        },
        "dct": "http://purl.org/dc/terms/",
        "examples": {
            "@id": "cr:examples",
            "@type": "@json"
        },
        "extract": "cr:extract",
        "field": "cr:field",
        "fileObject": "cr:fileObject",
        "fileProperty": "cr:fileProperty",
        "fileSet": "cr:fileSet",
        "format": "cr:format",
        "includes": "cr:includes",
        "isLiveDataset": "cr:isLiveDataset",
        "jsonPath": "cr:jsonPath",
        "key": "cr:key",
        "md5": "cr:md5",
        "parentField": "cr:parentField",
        "path": "cr:path",
        "rai": "http://mlcommons.org/croissant/RAI/",
        "recordSet": "cr:recordSet",
        "references": "cr:references",
        "regex": "cr:regex",
        "repeated": "cr:repeated",
        "replace": "cr:replace",
        "sc": "https://schema.org/",
        "separator": "cr:separator",
        "source": "cr:source",
        "subField": "cr:subField",
        "transform": "cr:transform"
    },
    "@type": "sc:Dataset",
    "citeAs": "@article{bao2024towards,\ntitle={Towards the prediction of drug solubility in binary solvent mixtures at various temperatures using machine learning},\nauthor={Bao, Zeqing and Tom, Gary and Cheng, Austin and Watchorn, Jeffrey and Aspuru-Guzik, Al{'a}n and Allen, Christine},\njournal={Journal of Cheminformatics},\nvolume={16},\nnumber={1},\npages={117},\nyear={2024},\npublisher={Springer}\n}\n",
    "conformsTo": "http://mlcommons.org/croissant/1.0",
    "datePublished": "2026-05-15 00:00:00",
    "description": "Dataset of drug solubility values (e.g., g/100g solvent) measured in various binary or ternary solvent mixtures at different temperatures.",
    "distribution": [
        {
            "@id": "github-repository",
            "@type": "cr:FileObject",
            "contentUrl": "https://github.com/chemcognition-lab/chemixhub",
            "description": "CheMixHub github repo.",
            "encodingFormat": "git+https",
            "name": "github-repository",
            "sha256": "main"
        },
        {
            "@id": "compounds.csv",
            "@type": "cr:FileObject",
            "contentUrl": "https://raw.githubusercontent.com/chemcognition-lab/chemixhub/refs/heads/main/datasets/drug-solubility/processed_data/compounds.csv",
            "description": "Single compounds",
            "encodingFormat": "text/csv",
            "name": "compounds.csv",
            "sha256": "ee74a0fb288f4c402dce14fce0b2fb8ffbc51a5e343b7121df0d2fe215a5db50"
        },
        {
            "@id": "mixtures.csv",
            "@type": "cr:FileObject",
            "contentUrl": "https://raw.githubusercontent.com/chemcognition-lab/chemixhub/refs/heads/main/datasets/drug-solubility/processed_data/processed_DrugSolubilityData.csv",
            "description": "Mixture definition",
            "encodingFormat": "text/csv",
            "name": "mixtures.csv",
            "sha256": "3f1a1a9d9b9a296fed8b1dc288f4f644535a76f3c4a5a486ad52d44d20ad669a"
        }
    ],
    "license": "https://creativecommons.org/licenses/by/4.0/",
    "name": "drug-solubility",
    "recordSet": [
        {
            "@id": "Compounds",
            "@type": "cr:RecordSet",
            "field": [
                {
                    "@id": "compound_id",
                    "@type": "cr:Field",
                    "dataType": "sc:Integer",
                    "description": "Index for compounds to reference with mixtures",
                    "name": "compound_id",
                    "source": {
                        "extract": {
                            "column": "compound_id"
                        },
                        "fileSet": {
                            "@id": "compounds.csv"
                        }
                    }
                },
                {
                    "@id": "smiles",
                    "@type": "cr:Field",
                    "dataType": "sc:Text",
                    "description": "isomeric canonical smiles",
                    "name": "smles",
                    "source": {
                        "extract": {
                            "column": "smiles"
                        },
                        "fileSet": {
                            "@id": "compounds.csv"
                        }
                    }
                },
                {
                    "@id": "name",
                    "@type": "cr:Field",
                    "dataType": "sc:Text",
                    "description": "Compound name",
                    "name": "name",
                    "source": {
                        "extract": {
                            "column": "name"
                        },
                        "fileSet": {
                            "@id": "compounds.csv"
                        }
                    }
                },
                {
                    "@id": "salt",
                    "@type": "cr:Field",
                    "dataType": "sc:Boolean",
                    "description": "Does the molecule have a salt?",
                    "name": "salt",
                    "source": {
                        "extract": {
                            "column": "salt"
                        },
                        "fileSet": {
                            "@id": "compounds.csv"
                        }
                    }
                }
            ],
            "name": "Compounds"
        },
        {
            "@id": "Mixtures",
            "@type": "cr:RecordSet",
            "field": [
                {
                    "@id": "value",
                    "@type": "cr:Field",
                    "dataType": "sc:Float",
                    "description": "Value",
                    "name": "value",
                    "source": {
                        "extract": {
                            "column": "value"
                        },
                        "fileSet": {
                            "@id": "mixtures.csv"
                        }
                    }
                },
                {
                    "@id": "Temperature_K",
                    "@type": "cr:Field",
                    "dataType": "sc:Float",
                    "description": "Temperature, K",
                    "name": "Temperature_K",
                    "source": {
                        "extract": {
                            "column": "Temperature, K"
                        },
                        "fileSet": {
                            "@id": "mixtures.csv"
                        }
                    }
                },
                {
                    "@id": "property",
                    "@type": "cr:Field",
                    "dataType": "sc:Text",
                    "description": "Property measured",
                    "name": "property",
                    "source": {
                        "extract": {
                            "column": "property"
                        },
                        "fileSet": {
                            "@id": "mixtures.csv"
                        }
                    }
                },
                {
                    "@id": "unit",
                    "@type": "cr:Field",
                    "dataType": "sc:Text",
                    "description": "Property units",
                    "name": "unit",
                    "source": {
                        "extract": {
                            "column": "unit"
                        },
                        "fileSet": {
                            "@id": "mixtures.csv"
                        }
                    }
                },
                {
                    "@id": "cmp_ids_solvent",
                    "@type": "cr:Field",
                    "dataType": "sc:Text",
                    "description": "Compound ids for solvent",
                    "name": "cmp_ids_solvent",
                    "source": {
                        "extract": {
                            "column": "cmp_ids_solvent"
                        },
                        "fileSet": {
                            "@id": "mixtures.csv"
                        }
                    }
                },
                {
                    "@id": "cmp_mole_fractions_solvent",
                    "@type": "cr:Field",
                    "dataType": "sc:Text",
                    "description": "Compound fractions for solvent",
                    "name": "cmp_mole_fractions_solvent",
                    "source": {
                        "extract": {
                            "column": "cmp_mole_fractions_solvent"
                        },
                        "fileSet": {
                            "@id": "mixtures.csv"
                        }
                    }
                },
                {
                    "@id": "cmp_ids_drug",
                    "@type": "cr:Field",
                    "dataType": "sc:Text",
                    "description": "Compound ids for drug",
                    "name": "cmp_ids_drug",
                    "source": {
                        "extract": {
                            "column": "cmp_ids_drug"
                        },
                        "fileSet": {
                            "@id": "mixtures.csv"
                        }
                    }
                },
                {
                    "@id": "cmp_mole_fractions_drug",
                    "@type": "cr:Field",
                    "dataType": "sc:Text",
                    "description": "Compound fractions for drug",
                    "name": "cmp_mole_fractions_drug",
                    "source": {
                        "extract": {
                            "column": "cmp_mole_fractions_drug"
                        },
                        "fileSet": {
                            "@id": "mixtures.csv"
                        }
                    }
                }
            ],
            "name": "Mixtures"
        }
    ],
    "url": "https://github.com/chemcognition-lab/chemixhub",
    "version": "0.99"
}
