{
    "id": 0,
    "domain": "jazz music",
    "datasets": [
        {
            "name": "data.csv",
            "description": "Related to improvisation, swing rhythms, and iconic jazz musicians.",
            "columns": [
                {
                    "name": "avg_audience_size",
                    "description": "Average audience size per festival."
                },
                {
                    "name": "music_style_complexity",
                    "description": "Count of distinct jazz genres performed by the ensemble."
                },
                {
                    "name": "years_playing_jazz",
                    "description": "Number of years the musician has been actively playing jazz music."
                },
                {
                    "name": "has_international_experience",
                    "description": "Indicates whether the ensemble has performed internationally."
                },
                {
                    "name": "venue_type",
                    "description": "The type of venue, categorizing its primary use and setting."
                },
                {
                    "name": "is_lead_instrument",
                    "description": "Indicates if the primary instrument is commonly associated as a jazz lead instrument (e.g., saxophone, trumpet)."
                },
                {
                    "name": "social_media_following",
                    "description": "The total count of followers of the venues official social media accounts."
                },
                {
                    "name": "venue_size",
                    "description": "The capacity of the venue where the musician performs most often."
                },
                {
                    "name": "jazz_genre_historicity",
                    "description": "Score representing the historic and cultural significance of the artist's primary jazz genre, scaled from 1 to 5."
                },
                {
                    "name": "total_jazz_albums",
                    "description": "Total number of albums released by the musician that primarily feature jazz music."
                },
                {
                    "name": "stage_presence_intensity",
                    "description": "Quantified measure of the musician's energy and engagement during live performances."
                },
                {
                    "name": "percentage_sold_out_shows",
                    "description": "The percentage of shows that are fully sold out in a season per venue."
                },
                {
                    "name": "years_of_experience",
                    "description": "The number of years the musician has been performing jazz."
                },
                {
                    "name": "performance_complexity",
                    "description": "A quantifiable measure of the improvisational and technical complexity of the artist's performance, scaled from 1 to 10."
                },
                {
                    "name": "unique_song_releases_last_year",
                    "description": "Number of unique songs released by the ensemble in the previous year."
                },
                {
                    "name": "uses_swing_rhythms",
                    "description": "Indicator whether swing rhythms are used exclusively by the musician."
                },
                {
                    "name": "region_jazz_popularity",
                    "description": "Popularity of jazz in the musician's primary active region on a scale from low to high."
                },
                {
                    "name": "number_of_improvisations_per_week",
                    "description": "Number of improvisations the musician engages in during performances per week."
                },
                {
                    "name": "weekend_performance",
                    "description": "Whether the performance is held on a weekend."
                },
                {
                    "name": "original_compositions",
                    "description": "Binary value indicating whether the artist primarily performs original compositions (True) or covers (False)."
                },
                {
                    "name": "international_song_percentage",
                    "description": "Percentage of songs in the ensemble's setlist that are international."
                },
                {
                    "name": "experience_to_improvisation_ratio",
                    "description": "Ratio of years of experience to the number of improvisations per week."
                },
                {
                    "name": "average_income_area",
                    "description": "Average income of the area where the venue is located."
                },
                {
                    "name": "latest_album_commercial_success",
                    "description": "Indicates whether the ensemble's latest album was commercially successful (sold over 10,000 copies)."
                },
                {
                    "name": "total_music_awards_won",
                    "description": "Total number of music awards won by the ensemble throughout their career."
                },
                {
                    "name": "genre_specific_events",
                    "description": "Number of genre-specific events (e.g., jazz) the venue hosts annually."
                },
                {
                    "name": "avg_performance_duration",
                    "description": "Average duration of setlist in hours per performance."
                },
                {
                    "name": "overseas_performance_count",
                    "description": "Total number of performances the ensemble has held outside their home country."
                }
            ]
        }
    ],
    "queries": [
        {
            "qid": 977,
            "question": "Given a dataset on jazz musicians that includes the years they have been playing jazz, the intensity of their stage presence, the total number of jazz albums they've released, the region's jazz popularity level, and whether their primary instrument is considered a lead jazz instrument, can you identify the key features that predict if a musician's primary instrument is a lead jazz instrument according to a complex relationship involving the total jazz albums, stage presence intensity, region's jazz popularity, years playing jazz, and specific threshold conditions?",
            "question_type": "general",
            "difficulty": 2,
            "target_col": "is_lead_instrument",
            "true_hypothesis": "The likelihood that a musician's primary instrument is considered a lead jazz instrument (e.g., saxophone, trumpet) can be predicted based on the total number of jazz albums released, the intensity of stage presence, the region's jazz popularity, and the musician's years playing jazz, where the product of the total jazz albums and stage presence intensity squared added to ten times the region's jazz popularity (ranging from low to high) surpasses 20, and the musician has been actively playing jazz for over 10 years.",
            "true_hypothesis_expr": "np.where(((df['total_jazz_albums']*df['stage_presence_intensity']**2 + df['region_jazz_popularity'].map({'low': 1, 'medium': 2, 'high': 3})*10) > 20) & (df['years_playing_jazz'] > 10), True, False)",
            "relevant_cols": [
                "years_playing_jazz",
                "stage_presence_intensity",
                "total_jazz_albums",
                "region_jazz_popularity",
                "is_lead_instrument"
            ]
        }
    ]
}