{
    "id": 1,
    "domain": "jazz music",
    "datasets": [
        {
            "name": "data.csv",
            "description": "Related to improvisation, swing rhythms, and iconic jazz musicians.",
            "columns": [
                {
                    "name": "jazz_genre_historicity",
                    "description": "Score representing the historic and cultural significance of the artist's primary jazz genre, scaled from 1 to 5."
                },
                {
                    "name": "primary_instrument",
                    "description": "The main instrument the musician uses to perform."
                },
                {
                    "name": "musician_id",
                    "description": "Unique identifier for each musician."
                },
                {
                    "name": "original_compositions",
                    "description": "Binary value indicating whether the artist primarily performs original compositions (True) or covers (False)."
                },
                {
                    "name": "ensemble_size",
                    "description": "The number of musicians in the ensemble."
                },
                {
                    "name": "years_playing_jazz",
                    "description": "Number of years the musician has been actively playing jazz music."
                },
                {
                    "name": "music_style_complexity",
                    "description": "Count of distinct jazz genres performed by the ensemble."
                },
                {
                    "name": "marketing_reach",
                    "description": "Binary indicator of whether the venue's marketing is local or global."
                },
                {
                    "name": "collaboration_count_with_known_jazz_musicians",
                    "description": "Number of collaborations with musicians recognized in the jazz genre."
                },
                {
                    "name": "overseas_performance_count",
                    "description": "Total number of performances the ensemble has held outside their home country."
                },
                {
                    "name": "unique_song_releases_last_year",
                    "description": "Number of unique songs released by the ensemble in the previous year."
                },
                {
                    "name": "ticket_price",
                    "description": "The standard ticket price for the venue."
                },
                {
                    "name": "artist_fame_level",
                    "description": "A scale representing the fame of the artist, ranging from local to international recognition."
                },
                {
                    "name": "experience_to_improvisation_ratio",
                    "description": "Ratio of years of experience to the number of improvisations per week."
                },
                {
                    "name": "avg_audience_size",
                    "description": "Average audience size per festival."
                },
                {
                    "name": "number_of_improvisations_per_week",
                    "description": "Number of improvisations the musician engages in during performances per week."
                },
                {
                    "name": "percentage_sold_out_shows",
                    "description": "The percentage of shows that are fully sold out in a season per venue."
                },
                {
                    "name": "uses_swing_rhythms",
                    "description": "Indicator of whether swing rhythms are used exclusively by the musician."
                },
                {
                    "name": "latest_album_commercial_success",
                    "description": "Indicates whether the ensemble's latest album was commercially successful (sold over 10,000 copies)."
                },
                {
                    "name": "festival_participation_count",
                    "description": "Total number of jazz festivals the ensemble has participated in."
                },
                {
                    "name": "artist_international_collaborations",
                    "description": "Count of distinct international artists the ensemble has collaborated with."
                },
                {
                    "name": "total_jazz_albums",
                    "description": "Total number of albums released by the musician that primarily feature jazz music."
                },
                {
                    "name": "average_income_area",
                    "description": "Average income of the area where the venue is located."
                },
                {
                    "name": "weekend_performance",
                    "description": "Whether the performance is held on a weekend."
                },
                {
                    "name": "region_jazz_popularity",
                    "description": "Popularity of jazz in the musician's primary active region on a scale from low to high."
                },
                {
                    "name": "performance_complexity",
                    "description": "A quantifiable measure of the improvisational and technical complexity of the artist's performance, scaled from 1 to 10."
                },
                {
                    "name": "international_song_percentage",
                    "description": "Percentage of songs in the ensemble's setlist that are international."
                },
                {
                    "name": "years_of_experience",
                    "description": "The number of years the musician has been performing jazz."
                },
                {
                    "name": "genre_specific_events",
                    "description": "Number of genre-specific events (e.g., jazz) the venue hosts annually."
                },
                {
                    "name": "avg_performance_duration",
                    "description": "Average duration of setlist in hours per performance."
                },
                {
                    "name": "social_media_following",
                    "description": "The total count of followers of the venue's official social media accounts."
                },
                {
                    "name": "venue_type",
                    "description": "The type of venue, categorizing its primary use and setting."
                },
                {
                    "name": "stage_presence_intensity",
                    "description": "Quantified measure of the musician's energy and engagement during live performances."
                },
                {
                    "name": "total_music_awards_won",
                    "description": "Total number of music awards won by the ensemble throughout their career."
                }
            ]
        }
    ],
    "queries": [
        {
            "qid": 986,
            "question": "Can we determine any trends between the complexity of jazz music styles performed by ensembles, the duration of their performances, and the number of international collaborations with their average audience size and ensemble size?",
            "question_type": "general",
            "difficulty": 2,
            "target_col": "ensemble_size",
            "true_hypothesis": "For jazz ensembles, the complexity of the music style (counted by number of distinct jazz genres performed), the average setlist performance duration, and the number of festival participations, along with a calculated factor based on international collaborations and audience size, are key determinants of ensemble size. Ensembles that play more complex styles, have longer performances, participate in more festivals, collaborate internationally, and attract larger audiences generally have more musicians.",
            "true_hypothesis_expr": "df['music_style_complexity'] + 2 * df['avg_performance_duration'] * (np.where(df['artist_international_collaborations'] + 2 * df['festival_participation_count'] ** 2 / df['avg_audience_size'] > 50, True, False)).astype(int) + 3",
            "relevant_cols": [
                "music_style_complexity",
                "avg_performance_duration",
                "avg_audience_size",
                "artist_international_collaborations",
                "festival_participation_count",
                "ensemble_size"
            ]
        }
    ]
}