{
    "id": 2,
    "domain": "jazz music",
    "datasets": [
        {
            "name": "data.csv",
            "description": "Related to improvisation, swing rhythms, and iconic jazz musicians.",
            "columns": [
                {
                    "name": "jazz_genre_historicity",
                    "description": "Score representing the historic and cultural significance of the artist's primary jazz genre, scaled from 1 to 5."
                },
                {
                    "name": "primary_instrument",
                    "description": "The main instrument the musician uses to perform."
                },
                {
                    "name": "musician_id",
                    "description": "Unique identifier for each musician."
                },
                {
                    "name": "original_compositions",
                    "description": "Binary value indicating whether the artist primarily performs original compositions (True) or covers (False)."
                },
                {
                    "name": "ensemble_size",
                    "description": "The number of musicians in the ensemble."
                },
                {
                    "name": "years_playing_jazz",
                    "description": "Number of years the musician has been actively playing jazz music."
                },
                {
                    "name": "music_style_complexity",
                    "description": "Count of distinct jazz genres performed by the ensemble."
                },
                {
                    "name": "marketing_reach",
                    "description": "Binary indicator whether the venue's marketing is local or global."
                },
                {
                    "name": "collaboration_count_with_known_jazz_musicians",
                    "description": "Number of collaborations with musicians recognized in the jazz genre."
                },
                {
                    "name": "overseas_performance_count",
                    "description": "Total number of performances the ensemble has held outside their home country."
                },
                {
                    "name": "unique_song_releases_last_year",
                    "description": "Number of unique songs released by the ensemble in the previous year."
                },
                {
                    "name": "ticket_price",
                    "description": "The standard ticket price for the venue."
                },
                {
                    "name": "artist_fame_level",
                    "description": "A scale representing the fame of the artist, ranging from local to international recognition."
                },
                {
                    "name": "experience_to_improvisation_ratio",
                    "description": "Ratio of years of experience to the number of improvisations per week."
                },
                {
                    "name": "avg_audience_size",
                    "description": "Average audience size per festival."
                },
                {
                    "name": "number_of_improvisations_per_week",
                    "description": "Number of improvisations the musician engages in during performances per week."
                },
                {
                    "name": "percentage_sold_out_shows",
                    "description": "The percentage of shows that are fully sold out in a season per venue."
                },
                {
                    "name": "uses_swing_rhythms",
                    "description": "Indicator whether swing rhythms are used exclusively by the musician."
                },
                {
                    "name": "latest_album_commercial_success",
                    "description": "Indicates whether the ensemble's latest album was commercially successful (sold over 10,000 copies)."
                },
                {
                    "name": "festival_participation_count",
                    "description": "Total number of jazz festivals the ensemble has participated in."
                },
                {
                    "name": "artist_international_collaborations",
                    "description": "Count of distinct international artists the ensemble has collaborated with."
                },
                {
                    "name": "total_jazz_albums",
                    "description": "Total number of albums released by the musician that primarily feature jazz music."
                },
                {
                    "name": "average_income_area",
                    "description": "Average income of the area where the venue is located."
                },
                {
                    "name": "weekend_performance",
                    "description": "Whether the performance is held on a weekend."
                },
                {
                    "name": "region_jazz_popularity",
                    "description": "Popularity of jazz in the musician's primary active region on a scale from low to high."
                },
                {
                    "name": "performance_complexity",
                    "description": "A quantifiable measure of the improvisational and technical complexity of the artist's performance, scaled from 1 to 10."
                },
                {
                    "name": "international_song_percentage",
                    "description": "Percentage of songs in the ensemble's setlist that are international."
                },
                {
                    "name": "years_of_experience",
                    "description": "The number of years the musician has been performing jazz."
                },
                {
                    "name": "genre_specific_events",
                    "description": "Number of genre-specific events (e.g., jazz) the venue hosts annually."
                },
                {
                    "name": "avg_performance_duration",
                    "description": "Average duration of setlist in hours per performance."
                },
                {
                    "name": "social_media_following",
                    "description": "The total count of followers of the venues official social media accounts."
                },
                {
                    "name": "venue_type",
                    "description": "The type of venue, categorizing its primary use and setting."
                },
                {
                    "name": "stage_presence_intensity",
                    "description": "Quantified measure of the musician's energy and engagement during live performances."
                },
                {
                    "name": "total_music_awards_won",
                    "description": "Total number of music awards won by the ensemble throughout their career."
                }
            ]
        }
    ],
    "queries": [
        {
            "qid": 994,
            "question": "Is there a relationship between the primary instrument played and the venue type for jazz musicians with over 20 years of experience?",
            "question_type": "general",
            "difficulty": 2,
            "target_col": "primary_instrument",
            "true_hypothesis": "Musicians who play in larger venues prefer the drums; musicians at outdoor festivals prefer the trumpet. In contrast, musicians who perform in small jazz clubs tend to play the piano. Artists with over 20 years of experience playing at large venues are more likely to play the drums.",
            "true_hypothesis_expr": "np.where((500 * df['artist_fame_level'] + 10 * df['ticket_price'] + 2000 * df['marketing_reach'].astype(int) > 1000) & (df['venue_type'] == 'outdoor_festival'), 'trumpet', np.where((500 * df['artist_fame_level'] + 10 * df['ticket_price'] + 2000 * df['marketing_reach'].astype(int) <= 100) & (df['venue_type'] == 'jazz_club'), 'piano', np.where((df['years_of_experience'] > 20) & (500 * df['artist_fame_level'] + 10 * df['ticket_price'] + 2000 * df['marketing_reach'].astype(int) > 2000), 'drums', 'bass')))",
            "relevant_cols": [
                "years_of_experience",
                "venue_type",
                "artist_fame_level",
                "ticket_price",
                "marketing_reach",
                "primary_instrument"
            ]
        }
    ]
}