{
    "id": 0,
    "domain": "meta science",
    "workflow_tags": "data cleaning, feature engineering, data selection, data matching, data integration, data deduplication, data standardization, meta regression, summary statistics",
    "domain_knowledge": "1. When working with multiple original and replication studies, a preprocessing and joining step is needed to gather the data required for meta-regression analysis. 2. Combining such study data has to account for study and author names and may need multiple heuristics for the ideal join, depending on the line of inquiry. 3. An extra step may also be required to handle duplicate values and missing pairs.",
    "datasets": [
        {
            "name": "meta-regression_study_data_heterogeneity_in_replication_projects.csv",
            "description": "Dataset contains information about original and replication studies. Columns specific to the original or the replication study are suffixed with .o or .r, respectively",
            "columns": {
                "raw": [
                    {
                        "name": "id",
                        "description": "Unique id for each O/R pair"
                    },
                    {
                        "name": "title",
                        "description": "Title of the research study"
                    },
                    {
                        "name": "authors.o",
                        "description": "Names of Original paper's authors"
                    },
                    {
                        "name": "pub_year",
                        "description": "Year of Publication of the study"
                    },
                    {
                        "name": "journal",
                        "description": "Journal in which the study was published"
                    },
                    {
                        "name": "volume",
                        "description": "Volume Number of the journal"
                    },
                    {
                        "name": "issue",
                        "description": "Issue Number of the journal"
                    },
                    {
                        "name": "discipline",
                        "description": "Discipline of original paper. One of the following: Social, Cognitive or Economics"
                    },
                    {
                        "name": "length",
                        "description": "Number of pages of original paper"
                    },
                    {
                        "name": "citations",
                        "description": "Number of citations of original paper"
                    },
                    {
                        "name": "effect_size.o",
                        "description": "Standardized effect size of original paper"
                    },
                    {
                        "name": "p_value.o",
                        "description": "P-value of original paper"
                    },
                    {
                        "name": "n.o",
                        "description": "Sample size of original paper"
                    },
                    {
                        "name": "effect_type",
                        "description": "Type of effect tested. One of the following: main effect, correlation, interaction"
                    },
                    {
                        "name": "effect_size.r",
                        "description": "Standardized effect size of replication"
                    },
                    {
                        "name": "p_value.r",
                        "description": "P-value of replication"
                    },
                    {
                        "name": "n_planned.r",
                        "description": "Planned sample size of replication"
                    },
                    {
                        "name": "n.r",
                        "description": "Sample size of replication"
                    },
                    {
                        "name": "power.o",
                        "description": "Post hoc power based on original effect size"
                    },
                    {
                        "name": "power.r",
                        "description": "Post hoc power based on replication effect size"
                    },
                    {
                        "name": "power_planned.r",
                        "description": "Planned power of the replication based on planned N and original ES"
                    },
                    {
                        "name": "experiment_country.o",
                        "description": "Country where original experiment was conducted"
                    },
                    {
                        "name": "experiment_country.r",
                        "description": "Country where replication is to be conducted"
                    },
                    {
                        "name": "experiment_language.o",
                        "description": "Language used with subjects in original experiment (English, German, Dutch, Polish, Hebrew, French, Italian, Arabic, Spanish, Korean)"
                    },
                    {
                        "name": "experiment_language.r",
                        "description": "Language to be used with subjects in replication (English, Polish, German, Dutch, Italian, Portuguese, Malay, Turkish, Czech, Arabic, Spanish)"
                    },
                    {
                        "name": "online.o",
                        "description": "If the original experiment was conducted online (1: yes, 0: no)"
                    },
                    {
                        "name": "online.r",
                        "description": "If the replication was conducted online (1: yes, 0: no)"
                    },
                    {
                        "name": "compensation.o",
                        "description": "Compensation in original experiment (credit, cash, nothing, mixed)"
                    },
                    {
                        "name": "compensation.r",
                        "description": "Compensation in replication (credit, cash, nothing, mixed)"
                    },
                    {
                        "name": "subjects.o",
                        "description": "Type of subjects used in original experiment (students, online, anyone, community)"
                    },
                    {
                        "name": "subjects.r",
                        "description": "Type of subjects used in replication (students, online, anyone, community)"
                    },
                    {
                        "name": "endprice",
                        "description": "Final market price in prediction market"
                    },
                    {
                        "name": "transactions",
                        "description": "Number of transactions in prediction market"
                    },
                    {
                        "name": "trading_volume",
                        "description": "Total volume of traded stocks in prediction market"
                    },
                    {
                        "name": "replicated",
                        "description": "Binary outcome variable; study is replicated if p <= 0.05 and effect goes in the same direction as the original"
                    },
                    {
                        "name": "project",
                        "description": "The replication project that the study was in (ml1: Many Labs 1, ml3: Many Labs 3, rpp: Psychology, ee: Experimental Economics)"
                    },
                    {
                        "name": "relative_es",
                        "description": "The continuous outcome variable; the ratio of the standardized replication effect size to the original effect size | relative effect size = (replication effect size / original effect size)"
                    },
                    {
                        "name": "n_authors.o",
                        "description": "Number of authors in original study"
                    },
                    {
                        "name": "n_authors.r",
                        "description": "Number of authors in replication"
                    },
                    {
                        "name": "author_citations_avg.o",
                        "description": "Average number of citations of authors in original study"
                    },
                    {
                        "name": "author_citations_max.o",
                        "description": "Number of citations of the author in original study with the highest citation count"
                    },
                    {
                        "name": "authors_male.o",
                        "description": "Ratio of male authors in original study"
                    },
                    {
                        "name": "seniority.o",
                        "description": "Most senior author in the original paper (Professor, Associate Professor, Assistant, Researcher, Assistant Professor)"
                    },
                    {
                        "name": "author_citations_avg.r",
                        "description": "Average number of citations of authors in replication study"
                    },
                    {
                        "name": "author_citations_max.r",
                        "description": "Number of citations of the author in replication study with the highest citation count"
                    },
                    {
                        "name": "authors_male.r",
                        "description": "Ratio of male authors in replication"
                    },
                    {
                        "name": "seniority.r",
                        "description": "Most senior author in the replication (Professor, Associate Professor, Assistant, Researcher, Assistant Professor)"
                    },
                    {
                        "name": "aggregated",
                        "description": "Aggregated column"
                    },
                    {
                        "name": "lab_id",
                        "description": "Unique id for each replication lab"
                    },
                    {
                        "name": "es_80power",
                        "description": "Standardized effect size required in replication to achieve 80% power"
                    },
                    {
                        "name": "same_country",
                        "description": "Original study and replication are in the same country"
                    },
                    {
                        "name": "same_language",
                        "description": "Original study and replication are in the same language"
                    },
                    {
                        "name": "same_online",
                        "description": "Original study and replication are both conducted online"
                    },
                    {
                        "name": "same_subjects",
                        "description": "Original study and replication use same type of subjects"
                    },
                    {
                        "name": "us_lab.o",
                        "description": "Original experiment lab in the US"
                    },
                    {
                        "name": "us_lab.r",
                        "description": "Replication experiment lab in the US"
                    },
                    {
                        "name": "drop",
                        "description": "Drop column"
                    }
                ]
            }
        },
        {
            "name": "meta-regression_replication_success_data_heterogeneity_in_replication_projects.csv",
            "description": "Data from four large-scale replication projects",
            "columns": {
                "raw": [
                    {
                        "name": "study",
                        "description": "Study identifier, usually names of authors from original study"
                    },
                    {
                        "name": "project",
                        "description": "Name of replication project"
                    },
                    {
                        "name": "ro",
                        "description": "Effect estimate of original study on correlation scale"
                    },
                    {
                        "name": "rr",
                        "description": "Effect estimate of replication study on correlation scale"
                    },
                    {
                        "name": "fiso",
                        "description": "Effect estimate of original study transformed to Fisher-z scale"
                    },
                    {
                        "name": "fisr",
                        "description": "Effect estimate of replication study transformed to Fisher-z scale"
                    },
                    {
                        "name": "se_fiso",
                        "description": "Standard error of Fisher-z transformed effect estimate of original study"
                    },
                    {
                        "name": "se_fisr",
                        "description": "Standard error of Fisher-z transformed effect estimate of replication study"
                    },
                    {
                        "name": "po",
                        "description": "Two-sided p-value from significance test of effect estimate from original study"
                    },
                    {
                        "name": "pr",
                        "description": "Two-sided p-value from significance test of effect estimate from replication study"
                    },
                    {
                        "name": "po1",
                        "description": "One-sided p-value from significance test of effect estimate from original study (in the direction of the original effect estimate)"
                    },
                    {
                        "name": "pr1",
                        "description": "One-sided p-value from significance test of effect estimate from replication study (in the direction of the original effect estimate)"
                    },
                    {
                        "name": "pm_belief",
                        "description": "Peer belief about whether replication effect estimate will achieve statistical significance elicited through prediction market (only available for EERP and SSRP)"
                    },
                    {
                        "name": "no",
                        "description": "Sample size in original study"
                    },
                    {
                        "name": "nr",
                        "description": "Sample size in replication study"
                    }
                ]
            }
        }
    ],
    "intermediate": [],
    "hypotheses": {
        "main": [
            {}
        ],
        "intermediate": []
    },
    "queries": [
        [
            {
                "qid": 0,
                "question_type": "relationship",
                "question": "What proportion of original studies in Psychology were conducted in the United States?"
            },
            {
                "qid": 1,
                "question_type": "relationship",
                "question": "What proportion of replication studies in Psychology were conducted in the United States?"
            }
        ]
    ]
}