{
    "id": 0,
    "domain": "biology",
    "workflow_tags": "regression",
    "domain_knowledge": "",
    "datasets": [
        {
            "name": "body-size-evolution-in-south-american-freshwater-fishes.csv",
            "description": "This dataset contains the drivers of speciation rates in South American freshwater fishes, employing an integrative approach that considers multiple biotic and abiotic factors.",
            "max_depth": 0,
            "columns": {
                "raw": [
                    {
                        "name": "HYBAS_ID",
                        "description": "Identifier for hydrological basins as defined by the HydroBASINS framework",
                        "depth": 0
                    },
                    {
                        "name": "long",
                        "description": "The longitude for specific geographic locations used to map the presence/absence of species.",
                        "depth": 0
                    },
                    {
                        "name": "lat",
                        "description": "The latitude for specific geographic locations used to map the presence/absence of species.",
                        "depth": 0
                    },
                    {
                        "name": "BAMM_speciation",
                        "description": "This variable represents the average speciation rates of species within each sub-basin, as estimated by BAMM",
                        "depth": 0
                    },
                    {
                        "name": "BAMM_extinction",
                        "description": "This variable represents the mean extinction rates for each tip of the phylogenetic tree, as estimated by the BAMM analysis",
                        "depth": 0
                    },
                    {
                        "name": "BAMM_NetDiv",
                        "description": "This variable stands for the net diversification rates, which are calculated by subtracting the mean extinction rates from the mean \nspeciation rates for each tip in the phylogenetic tree.",
                        "depth": 0
                    },
                    {
                        "name": "DR",
                        "description": "Diversification Rate, a transformed measure of evolutionary distinctness to understand phylogenetic diversity. The lower the \"ed\" value, the higher the \"DR\" metric, indicating a species with less unique evolutionary history compared to others in the phylogeny.",
                        "depth": 0
                    },
                    {
                        "name": "BEL_evol",
                        "description": "Rates of Body Elongation evolution",
                        "depth": 0
                    },
                    {
                        "name": "MBL_evol",
                        "description": "Rates of Maximum Body Length evolution",
                        "depth": 0
                    },
                    {
                        "name": "OGP_evol",
                        "description": "Rates of Oral Gape Position Evolution",
                        "depth": 0
                    },
                    {
                        "name": "RES_evol",
                        "description": "Rates of Relative Eye Size Evolution",
                        "depth": 0
                    },
                    {
                        "name": "RML_evol",
                        "description": "Rate of Relative Maxillary Length evolution",
                        "depth": 0
                    },
                    {
                        "name": "bio1",
                        "description": "This variable represents the annual mean temperature.",
                        "depth": 0
                    },
                    {
                        "name": "bio12",
                        "description": "This variable represents the annual mean precipitation.",
                        "depth": 0
                    },
                    {
                        "name": "runoff",
                        "description": "This variable is used to represent the quantity of water from precipitation that flows over the land's surface and does not get absorbed into the ground. It is being extracted from a geographic database (HydroAtlas).",
                        "depth": 0
                    },
                    {
                        "name": "aet",
                        "description": "Actual evapotranspiration, which is the sum of evaporation and plant transpiration from the Earth's land and ocean surface to the atmosphere.",
                        "depth": 0
                    },
                    {
                        "name": "Elevation",
                        "description": "Mean elevation data indicating the height above sea level.",
                        "depth": 0
                    },
                    {
                        "name": "sgr",
                        "description": "Stream gradient is a measure of the steepness or incline of a stream or river. It can affect water flow and sediment transport, which in turn can influence the habitat conditions for freshwater species. Higher stream gradients usually correspond to faster-moving \nwater and can create different ecological conditions compared to lower gradients.",
                        "depth": 0
                    },
                    {
                        "name": "soil_div",
                        "description": "It measures the diversity of soil types or conditions within each sub-basin studied. Soil diversity is computed using a dataset that includes eight variables related to substrate types and soil conditions.",
                        "depth": 0
                    },
                    {
                        "name": "area",
                        "description": "The geographic area of a sub-basin, possibly in square meters, used as one of the predictors in the analysis.",
                        "depth": 0
                    },
                    {
                        "name": "diversity",
                        "description": "Species diversity, which in ecological studies typically refers to the number of species and their relative abundances in a given area.",
                        "depth": 0
                    }
                ]
            }
        }
    ],
    "intermediate": [],
    "hypotheses": {
        "main": [
            {
                "depth": 0,
                "target": "",
                "expr": "",
                "expr_ind": "",
                "text": "The rate of maximum body length evolution emerged as the most influential factor explaining spatial variation in speciation rates. The relationship is positive with linear coefficient 0.82."
            }
        ],
        "intermediate": []
    },
    "workflow": "1. OLS Regression with 10 independent varialbes\n['RML_evol','MBL_evol','OGP_evol','BEL_evol','diversity','runoff','Elevation','sgr','soil_div','area']\n2. And 'BAMM_speciation' as the dependent variable",
    "queries": [
        [
            {
                "qid": 0,
                "true_hypothesis": "The rate of maximum body length evolution emerged as the most influential factor explaining spatial variation in speciation rates. The relationship is positive with linear coefficient 0.82.",
                "question_type": "variable",
                "question": "Is the maximum body length evolution the most impactful factor in explaining the speciation rates?"
            },
            {
                "qid": 1,
                "true_hypothesis": "The rate of maximum body length evolution emerged as the most influential factor explaining spatial variation in speciation rates. The relationship is positive with linear coefficient 0.82.",
                "question_type": "variable",
                "question": "What explained the spatial variation in speciation rates, where the rate of maximum body length evolution was identified as the most influential factor with a positive relationship coefficient of 0.82?"
            },
            {
                "qid": 2,
                "true_hypothesis": "The rate of maximum body length evolution emerged as the most influential factor explaining spatial variation in speciation rates. The relationship is positive with linear coefficient 0.82.",
                "question_type": "relationhsip",
                "question": "What is the linear coefficient that describes the positive relationship between the rate of maximum body length evolution and spatial variation in speciation rates, where the former emerges as the most influential factor?"
            }
        ]
    ]
}