{
    "id": 0,
    "domain": "sociology",
    "workflow_tags": "regression",
    "domain_knowledge": "Spending and saving behavior can be used as proxies for an individual's time preference.",
    "datasets": [
        {
            "name": "nls_bmi_processed.csv",
            "description": "This dataset, from the National Longitudinal Survey of Youth (NLSY79), includes variables such as gender, age, income, savings behavior, BMI, and racial background.",
            "max_depth": 0,
            "columns": {
                "raw": [
                    {
                        "name": "GENDER",
                        "description": "Gender of the Respondent (MALE or FEMALE)",
                        "depth": 0
                    },
                    {
                        "name": "AGE",
                        "description": "The age of the respondent in the year 1989",
                        "depth": 0
                    },
                    {
                        "name": "AGE_2",
                        "description": "Square of the age of the Respondent",
                        "depth": 0
                    },
                    {
                        "name": "INCOME",
                        "description": "The income of the respondent in the year 1989",
                        "depth": 0
                    },
                    {
                        "name": "DISSAVED",
                        "description": "A boolean variable that equals 1 if the respondent took more money out of than put into savings and equals 0 otherwise",
                        "depth": 0
                    },
                    {
                        "name": "SAMESAVE",
                        "description": "A boolean variable that equals 1 if the respondent's savings level did not change or the respondent had no savings, and is 0 otherwise",
                        "depth": 0
                    },
                    {
                        "name": "BMI",
                        "description": "Body mass index of the respondent, calculated with the standard formula from the respondent's height in 1985 and weight in 1989",
                        "depth": 0
                    },
                    {
                        "name": "BLACK",
                        "description": "A boolean variable that indicates whether or not the respondent belongs to the black race",
                        "depth": 0
                    },
                    {
                        "name": "HISPANIC",
                        "description": "A boolean variable that indicates whether or not the respondent belongs to the Hispanic race",
                        "depth": 0
                    }
                ]
            }
        }
    ],
    "intermediate": [],
    "hypotheses": {
        "main": [
            {
                "depth": 0,
                "target": "",
                "expr": "",
                "expr_ind": "",
                "text": "Higher time preference is associated with higher BMI in the 1989 data. BMI is positively related to whether a person spent more than they saved, with a coefficient of 0.3596. BMI is also positively correlated with whether a person's savings remained unchanged, with a coefficient of 0.4858."
            }
        ],
        "intermediate": []
    },
    "workflow": "1. Chose BMI as the dependent variable.\n2. Chose 'DISSAVED' and 'SAMESAVE' as the time preference (independent) variables.\n3. Fit an OLS regression model and returned the model summary.",
    "queries": [
        [
            {
                "qid": 0,
                "true_hypothesis": "Higher time preference is associated with higher BMI in the 1989 data. BMI is positively related to whether a person spent more than they saved, with a coefficient of 0.3596. BMI is also positively correlated with whether a person's savings remained unchanged, with a coefficient of 0.4858.",
                "question_type": "variables",
                "question": "Which time-preference-related factors are associated with higher BMI in the 1989 data?"
            },
            {
                "qid": 1,
                "true_hypothesis": "Higher time preference is associated with higher BMI in the 1989 data. BMI is positively related to whether a person spent more than they saved, with a coefficient of 0.3596. BMI is also positively correlated with whether a person's savings remained unchanged, with a coefficient of 0.4858.",
                "question_type": "relationship",
                "question": "How is higher time preference related to BMI in the 1989 data?"
            }
        ]
    ]
}