{
    "id": 2,
    "domain": "jazz music",
    "datasets": [
        {
            "name": "data.csv",
            "description": "Related to improvisation, swing rhythms, and iconic jazz musicians.",
            "columns": [
                {
                    "name": "number_of_improvisations_per_week",
                    "description": "Number of improvisations the musician engages in during performances per week."
                },
                {
                    "name": "latest_album_commercial_success",
                    "description": "Indicates whether the ensemble's latest album was commercially successful (sold over 10,000 copies)."
                },
                {
                    "name": "percentage_sold_out_shows",
                    "description": "The percentage of shows that are fully sold out in a season per venue."
                },
                {
                    "name": "musician_id",
                    "description": "Unique identifier for each musician."
                },
                {
                    "name": "weekend_performance",
                    "description": "Whether the performance is held on a weekend."
                },
                {
                    "name": "international_song_percentage",
                    "description": "Percentage of songs in the ensemble's setlist that are international."
                },
                {
                    "name": "primary_instrument",
                    "description": "The main instrument the musician uses to perform."
                },
                {
                    "name": "performance_complexity",
                    "description": "A quantifiable measure of the improvisational and technical complexity of the artist's performance, scaled from 1 to 10."
                },
                {
                    "name": "uses_swing_rhythms",
                    "description": "Indicator whether swing rhythms are used exclusively by the musician."
                },
                {
                    "name": "marketing_reach",
                    "description": "Binary indicator whether the venue's marketing is local or global."
                },
                {
                    "name": "total_jazz_albums",
                    "description": "Total number of albums released by the musician that primarily feature jazz music."
                },
                {
                    "name": "avg_performance_duration",
                    "description": "Average duration of setlist in hours per performance."
                },
                {
                    "name": "social_media_following",
                    "description": "The total count of followers of the venues official social media accounts."
                },
                {
                    "name": "venue_size",
                    "description": "The capacity of the venue where the musician performs most often."
                },
                {
                    "name": "unique_song_releases_last_year",
                    "description": "Number of unique songs released by the ensemble in the previous year."
                },
                {
                    "name": "festival_participation_count",
                    "description": "Total number of jazz festivals the ensemble has participated in."
                },
                {
                    "name": "average_income_area",
                    "description": "Average income of the area where the venue is located."
                },
                {
                    "name": "ticket_price",
                    "description": "The standard ticket price for the venue."
                },
                {
                    "name": "total_music_awards_won",
                    "description": "Total number of music awards won by the ensemble throughout their career."
                },
                {
                    "name": "jazz_genre_historicity",
                    "description": "Score representing the historic and cultural significance of the artist's primary jazz genre, scaled from 1 to 5."
                },
                {
                    "name": "ensemble_size",
                    "description": "The number of musicians in the ensemble."
                },
                {
                    "name": "stage_presence_intensity",
                    "description": "Quantified measure of the musician's energy and engagement during live performances."
                },
                {
                    "name": "artist_international_collaborations",
                    "description": "Count of distinct international artists the ensemble has collaborated with."
                },
                {
                    "name": "has_international_experience",
                    "description": "Indicates whether the ensemble has performed internationally."
                },
                {
                    "name": "overseas_performance_count",
                    "description": "Total number of performances the ensemble has held outside their home country."
                },
                {
                    "name": "is_lead_instrument",
                    "description": "Indicates if the primary instrument is commonly associated as a jazz lead instrument (e.g., saxophone, trumpet)."
                },
                {
                    "name": "collaboration_count_with_known_jazz_musicians",
                    "description": "Number of collaborations with musicians recognized in the jazz genre."
                },
                {
                    "name": "artist_fame_level",
                    "description": "A scale representing the fame of the artist, ranging from local to international recognition."
                },
                {
                    "name": "genre_specific_events",
                    "description": "Number of genre-specific events (e.g., jazz) the venue hosts annually."
                },
                {
                    "name": "avg_audience_size",
                    "description": "Average audience size per festival."
                },
                {
                    "name": "music_style_complexity",
                    "description": "Count of distinct jazz genres performed by the ensemble."
                },
                {
                    "name": "years_playing_jazz",
                    "description": "Number of years the musician has been actively playing jazz music."
                },
                {
                    "name": "original_compositions",
                    "description": "Binary value indicating whether the artist primarily performs original compositions (True) or covers (False)."
                },
                {
                    "name": "experience_to_improvisation_ratio",
                    "description": "Ratio of years of experience to the number of improvisations per week."
                },
                {
                    "name": "region_jazz_popularity",
                    "description": "Popularity of jazz in the musician's primary active region on a scale from low to high."
                },
                {
                    "name": "years_of_experience",
                    "description": "The number of years the musician has been performing jazz."
                },
                {
                    "name": "venue_type",
                    "description": "The type of venue, categorizing its primary use and setting."
                }
            ]
        }
    ],
    "queries": [
        {
            "qid": 993,
            "question": "Is there a relationship between the primary instrument played by musicians and the size of the venue they perform in?",
            "question_type": "general",
            "difficulty": 1,
            "target_col": "primary_instrument",
            "true_hypothesis": "Musicians who play in larger venues prefer the drums; musicians at outdoor festivals prefer the trumpet. On the other hand, musicians who perform in small jazz clubs tend to play the piano, while those with over 20 years of experience and playing at large venues are more likely to play the bass.",
            "true_hypothesis_expr": "np.where((df['venue_size'] > 1000) & (df['venue_type'] == 'outdoor_festival'), 'trumpet', np.where((df['venue_size'] <= 100) & (df['venue_type'] == 'jazz_club'), 'piano', np.where((df['years_of_experience'] > 20) & (df['venue_size'] > 2000), 'drums', 'bass')))",
            "relevant_cols": [
                "years_of_experience",
                "venue_type",
                "venue_size",
                "primary_instrument"
            ]
        }
    ]
}