import json
import pandas as pd
from pathlib import Path
from typing import Any, Optional
from mlebench.registry import registry

def read_csv(*args, **kwargs) -> pd.DataFrame:
    """Reads a CSV file and returns a DataFrame with custom default kwargs."""
    try:
        new_default_kwargs = {"float_precision": "round_trip"}
        new_kwargs = {**new_default_kwargs, **kwargs}
        return pd.read_csv(*args, **new_kwargs)
    except pd.errors.EmptyDataError:
        return pd.DataFrame()

def read_jsonl(file_path: str) -> list[dict]:
    """Read a JSONL file and return a list of dictionaries of its content."""
    with open(file_path, "r") as f:
        return [json.loads(line) for line in f]

def load_answers(path_to_answers: Path) -> Any:
    if path_to_answers.suffix == ".csv":
        return read_csv(path_to_answers)

    if path_to_answers.suffix == ".jsonl":
        return read_jsonl(str(path_to_answers))

    raise ValueError(f"Unsupported file format for answers: {path_to_answers}")

class InvalidSubmissionError(Exception):
    pass

class Grader:
    def __init__(self, name: str, grade_fn: Any) -> None:
        self.name = name
        self.grade_fn = grade_fn

    def is_lower_better(self, leaderboard: pd.DataFrame) -> bool:
        scores = leaderboard["score"]
        top_score = scores.iloc[0]
        bottom_score = scores.iloc[-1]
        return bool(top_score < bottom_score)

    def __call__(self, submission: pd.DataFrame, answers: Any) -> Optional[float]:
        try:
            score = self.grade_fn(submission, answers)
        except Exception as e:
            print(f"Error during grading: {e}")
            return None
        return round(score, 5)

    def rank_score(self, score: Optional[float], leaderboard: pd.DataFrame) -> dict:
        if score is None:
            return {
                "gold_medal": False, "silver_medal": False, "bronze_medal": False, "above_median": False,
                "gold_threshold": None, "silver_threshold": None, "bronze_threshold": None, "median_threshold": None
            }

        lower_is_better = self.is_lower_better(leaderboard)
        num_teams = len(leaderboard)
        scores = leaderboard["score"]

        def get_score_at_position(position: int) -> float:
            if position - 1 >= len(scores) or position < 1:
                return scores.iloc[-1]
            return scores.iloc[position - 1]

        def get_thresholds(num_teams: int) -> tuple[float, float, float, float]:
            if 1 <= num_teams < 100:
                gold_threshold = get_score_at_position(max(1, int(num_teams * 0.1)))
                silver_threshold = get_score_at_position(max(1, int(num_teams * 0.2)))
                bronze_threshold = get_score_at_position(max(1, int(num_teams * 0.4)))
            elif 100 <= num_teams < 250:
                gold_threshold = get_score_at_position(10)
                silver_threshold = get_score_at_position(max(1, int(num_teams * 0.2)))
                bronze_threshold = get_score_at_position(max(1, int(num_teams * 0.4)))
            elif 250 <= num_teams < 1000:
                gold_threshold = get_score_at_position(10 + int(num_teams * 0.002))
                silver_threshold = get_score_at_position(50)
                bronze_threshold = get_score_at_position(100)
            else:
                gold_threshold = get_score_at_position(10 + int(num_teams * 0.002))
                silver_threshold = get_score_at_position(50 + int(num_teams * 0.05))
                bronze_threshold = get_score_at_position(100 + int(num_teams * 0.1))
            
            median_threshold = get_score_at_position(int(num_teams * 0.5))
            return gold_threshold, silver_threshold, bronze_threshold, median_threshold

        gold_t, silver_t, bronze_t, median_t = get_thresholds(num_teams)

        if lower_is_better:
            return {
                "gold_medal": score <= gold_t,
                "silver_medal": score <= silver_t,
                "bronze_medal": score <= bronze_t,
                "above_median": score <= median_t,
                "gold_threshold": gold_t, "silver_threshold": silver_t, "bronze_threshold": bronze_t, "median_threshold": median_t
            }
        else:
            return {
                "gold_medal": score >= gold_t,
                "silver_medal": score >= silver_t,
                "bronze_medal": score >= bronze_t,
                "above_median": score >= median_t,
                "gold_threshold": gold_t, "silver_threshold": silver_t, "bronze_threshold": bronze_t, "median_threshold": median_t
            }

def grade_sample(submission_path: Path, competition_id: str):
    competition = registry.get_competition(competition_id)
    
    # Check if dataset is prepared (simplified check)
    if not competition.public_dir.exists() or not competition.private_dir.exists():
        print(f"Dataset for {competition_id} is not prepared.")
        return

    submission_df = read_csv(submission_path)
    answers = load_answers(competition.answers)
    
    # Use the grader from the registry directly, but wrap it if needed or use its call method
    # The registry's grader is already an instance of mlebench.grade_helpers.Grader
    # We can use it directly
    score = competition.grader(submission_df, answers)
    
    if score is None:
        print("Grading failed.")
        return

    leaderboard = pd.read_csv(competition.leaderboard)
    # We need to use our local Grader logic for ranking if we want to be independent, 
    # or we can just use the competition.grader.rank_score if we trust the environment.
    # To be "minimal dependency" but still functional, we'll use the logic we defined above.
    
    # Create a local grader instance just for the rank_score logic
    local_grader = Grader(competition.grader.name, competition.grader.grade_fn)
    rank_info = local_grader.rank_score(score, leaderboard)
    
    report = {
        "competition_id": competition_id,
        "score": float(score) if score is not None else None,
        **{k: bool(v) if isinstance(v, (bool, np.bool_)) else float(v) if isinstance(v, (float, np.floating)) else v for k, v in rank_info.items()}
    }
    
    print(json.dumps(report, indent=4))

if __name__ == "__main__":
    import sys
    import numpy as np
    from mlebench.grade import grade_csv
    if len(sys.argv) < 2:
        print("Usage: python extracted_grader.py <competition_id>")
        sys.exit(1)
    submission_path = Path("experiment/mlebench/competitions")
    competition_id = sys.argv[1]
    submission_path = submission_path / str(competition_id) / "submission.csv"
    competition = registry.get_competition(competition_id)
    # grade_sample(submission_path, competition_id)
    report=grade_csv(submission_path, competition)
    print("Competition report:")
    print(json.dumps(report.to_dict(), indent=4))
    # 保存评分报告到对应竞赛目录
    report_path = submission_path.parent / "grading_report.json"
    with open(report_path, "w", encoding="utf-8") as f:
        json.dump(report.to_dict(), f, indent=4, ensure_ascii=False)
        print(f"Grading report saved to {report_path}")
