{
    "id": 0,
    "domain": "jazz music",
    "datasets": [
        {
            "name": "data.csv",
            "description": "Related to improvisation, swing rhythms, and iconic jazz musicians.",
            "columns": [
                {
                    "name": "genre_specific_events",
                    "description": "Number of genre-specific events (e.g., jazz) the venue hosts annually."
                },
                {
                    "name": "jazz_genre_historicity",
                    "description": "Score representing the historic and cultural significance of the artist's primary jazz genre, scaled from 1 to 5."
                },
                {
                    "name": "avg_performance_duration",
                    "description": "Average duration of setlist in hours per performance."
                },
                {
                    "name": "music_style_complexity",
                    "description": "Count of distinct jazz genres performed by the ensemble."
                },
                {
                    "name": "stage_presence_intensity",
                    "description": "Quantified measure of the musician's energy and engagement during live performances."
                },
                {
                    "name": "number_of_improvisations_per_week",
                    "description": "Number of improvisations the musician engages in during performances per week."
                },
                {
                    "name": "social_media_following",
                    "description": "The total count of followers of the venue's official social media accounts."
                },
                {
                    "name": "weekend_performance",
                    "description": "Whether the performance is held on a weekend."
                },
                {
                    "name": "original_compositions",
                    "description": "Binary value indicating whether the artist primarily performs original compositions (True) or covers (False)."
                },
                {
                    "name": "unique_song_releases_last_year",
                    "description": "Number of unique songs released by the ensemble in the previous year."
                },
                {
                    "name": "avg_audience_size",
                    "description": "Average audience size per festival."
                },
                {
                    "name": "years_of_experience",
                    "description": "The number of years the musician has been performing jazz."
                },
                {
                    "name": "latest_album_commercial_success",
                    "description": "Indicates whether the ensemble's latest album was commercially successful (sold over 10,000 copies)."
                },
                {
                    "name": "percentage_sold_out_shows",
                    "description": "The percentage of shows that are fully sold out in a season per venue."
                },
                {
                    "name": "uses_swing_rhythms",
                    "description": "Indicates whether the musician uses swing rhythms exclusively."
                },
                {
                    "name": "performance_complexity",
                    "description": "A quantifiable measure of the improvisational and technical complexity of the artist's performance, scaled from 1 to 10."
                },
                {
                    "name": "primary_instrument",
                    "description": "The main instrument the musician uses to perform."
                },
                {
                    "name": "total_jazz_albums",
                    "description": "Total number of albums released by the musician that primarily feature jazz music."
                },
                {
                    "name": "musician_id",
                    "description": "Unique identifier for each musician."
                },
                {
                    "name": "total_music_awards_won",
                    "description": "Total number of music awards won by the ensemble throughout their career."
                },
                {
                    "name": "overseas_performance_count",
                    "description": "Total number of performances the ensemble has held outside their home country."
                },
                {
                    "name": "international_song_percentage",
                    "description": "Percentage of songs in the ensemble's setlist that are international."
                },
                {
                    "name": "region_jazz_popularity",
                    "description": "Popularity of jazz in the musician's primary active region, rated as low, medium, or high."
                },
                {
                    "name": "ensemble_size",
                    "description": "The number of musicians in the ensemble."
                },
                {
                    "name": "experience_to_improvisation_ratio",
                    "description": "Ratio of years of experience to the number of improvisations per week."
                },
                {
                    "name": "venue_type",
                    "description": "The type of venue, categorizing its primary use and setting."
                },
                {
                    "name": "years_playing_jazz",
                    "description": "Number of years the musician has been actively playing jazz music."
                },
                {
                    "name": "average_income_area",
                    "description": "Average income of the area where the venue is located."
                }
            ]
        }
    ],
    "queries": [
        {
            "qid": 980,
            "question": "What is the relationship between the usage of swing rhythms, total number of jazz albums, and the region's jazz popularity in determining a musician's 'musician_id' value in this dataset?",
            "question_type": "general",
            "difficulty": 3,
            "target_col": "musician_id",
            "true_hypothesis": "Musicians who have a high ratio of experience to improvisation, collaborated with over 20 known jazz musicians and played jazz for over 10 years are more likely to have higher values in the 'musician_id' column, especially if they use swing rhythms.",
            "true_hypothesis_expr": "10000 * (df['experience_to_improvisation_ratio'] / 50) + 5000 * np.where(((df['total_jazz_albums']*df['stage_presence_intensity']**2 + df['region_jazz_popularity'].map({'low': 1, 'medium': 2, 'high': 3})*10) > 20) & (df['years_playing_jazz'] > 10), True, False) + 3000 * df['uses_swing_rhythms']",
            "relevant_cols": [
                "uses_swing_rhythms",
                "experience_to_improvisation_ratio",
                "years_playing_jazz",
                "stage_presence_intensity",
                "total_jazz_albums",
                "region_jazz_popularity",
                "musician_id"
            ]
        }
    ]
}