{
    "id": 0,
    "domain": "virtual concerts",
    "datasets": [
        {
            "name": "data.csv",
            "description": "Related to online music performances, digital shows, and live streaming.",
            "columns": [
                {
                    "name": "artist_time_zone",
                    "description": "Primary time zone of the featured artists."
                },
                {
                    "name": "interactive_features_available",
                    "description": "Indicates whether interactive features (e.g., live polling, request a song) were available during the concert"
                },
                {
                    "name": "engagement_rate",
                    "description": "The percentage of engaged users among the viewers."
                },
                {
                    "name": "interactive_elements",
                    "description": "Indicates if the virtual concert incorporated interactive features such as live chats, polls, or viewer choices."
                },
                {
                    "name": "concert_length_minutes",
                    "description": "Total duration of the concert in minutes."
                },
                {
                    "name": "advertising_budget",
                    "description": "The amount of money spent on advertising the virtual concert."
                },
                {
                    "name": "engagement_score",
                    "description": "Numerical score representing the level of engagement with the virtual concert."
                },
                {
                    "name": "artist_age_group",
                    "description": "The predominant age group of the artist's audience."
                },
                {
                    "name": "guest_artist_present",
                    "description": "Indicates whether guest artists performed during the concert."
                },
                {
                    "name": "production_team_size",
                    "description": "The number of individuals in the production team organizing the concert."
                },
                {
                    "name": "streaming_platform",
                    "description": "The platform on which the virtual concert was hosted."
                },
                {
                    "name": "audience_reach",
                    "description": "Estimated number of potential viewers for the concert from around the world."
                },
                {
                    "name": "target_audience_diversity",
                    "description": "A binary indicator where 1 represents high diversity of the target audience in terms of global distribution and 0 represents low diversity."
                },
                {
                    "name": "streaming_platforms_count",
                    "description": "Number of different digital platforms where the concert will be streamed."
                },
                {
                    "name": "concert_time_slot",
                    "description": "The time slot of the concert, categorized as morning, afternoon, or evening."
                },
                {
                    "name": "concert_genre",
                    "description": "Musical genre of the concert."
                },
                {
                    "name": "total_viewer_count",
                    "description": "Total number of people who watched the concert online."
                },
                {
                    "name": "exclusive_content_offered",
                    "description": "Whether exclusive downloadable content was offered with the concert ticket."
                }
            ]
        }
    ],
    "queries": [
        {
            "qid": 662,
            "question": "Is there a relationship between the engagement score of virtual concerts with predominantly Gen Z audiences and the time slot the concert is scheduled during, the presence of interactive elements, the advertising budget, the artist's time zone, and the day of the week?",
            "question_type": "general",
            "difficulty": 3,
            "target_col": "engagement_score",
            "true_hypothesis": "Artists with predominantly Gen Z audiences will see a 40% higher engagement score when the virtual concert incorporates interactive elements, the advertising budget is above 50000 and the artist's time zone is 'UTC', and the concert is scheduled during the evening time slot on Friday as opposed to Wednesday.",
            "true_hypothesis_expr": "df['interactive_elements'].astype(int) * (np.where((df['advertising_budget'] > 50000) & (df['artist_time_zone'] == 'UTC'), True, False)).astype(int) * 1000 + 500 * (np.where(np.where((df['interactive_elements'] == True) & (df['concert_time_slot'] == 'evening'), 'Friday', 'Wednesday').isin(['Monday', 'Tuesday', 'Wednesday', 'Thursday', 'Friday']), 1.4, 1)) * (np.where(df['artist_age_group'] == 'Gen Z', 1.4, 1))",
            "relevant_cols": [
                "concert_time_slot",
                "interactive_elements",
                "advertising_budget",
                "artist_time_zone",
                "artist_age_group",
                "engagement_score"
            ]
        }
    ]
}