#!/usr/bin/python3
"""
Genomics of Drug Sensitivity in Cancer (GDSC) Knowledge Bource.

Author(s):
    Anonymized Authors @anonymized-authors

Citation(s):
    [1] Garnett M, Edelman E, Heidorn S, et al. Systematic identification of
        genomic markers of drug sensitivity in cancer cells. Nature 483:
        570-5 (2012). doi: 10.1038/nature11005
    [2] Iorio F, Knijnenburg TA, Vis DJ, et al. A landscape of pharmacogenomic
        interactions in cancer. Cell 166(3): 740-54. (2016). doi:
        10.1016/j.cell.2016.06.017
    [3] Yang W, Soares J, Greninger P, et al. Genomics of drug sensitivity
        in cancer (GDSC): A resource for therapeutic biomarker discovery in
        cancer cells. Nucleic Acids Res 41(D1): D955-61 (2013). doi:
        10.1093/nar/gks1111

Licensed under the Apache License, Version 2.0. Copyright Anonymized, Inc. 2025.
"""
import pandas as pd
from typing import Any, Dict, List, Optional

from .base import BioEntity, KnowledgeBase


class DrugName(BioEntity):
    def __new__(cls, name: str, synonyms: Optional[List[str]] = None):
        """
        Args:
            name: the official name of the cell.
            synonyms: optional synonyms of the cell.
        """
        return BioEntity("drug", name, synonyms)


class GDSCKnowledgeBase(KnowledgeBase):
    url: str = (
        "https://cog.sanger.ac.uk/cancerrxgene/GDSC_release8.5/"
        "screened_compounds_rel_8.5.csv"
    )

    def __init__(self, *args: Any, **kwargs: Dict[str, Any]):
        """
        Args:
            None.
        """
        del args, kwargs
        super(GDSCKnowledgeBase, self).__init__(top_k=1)
        self.data = {}
        for _, row in pd.read_csv(self.url).iterrows():
            synonyms = None
            if row["SYNONYMS"] is not None and (
                isinstance(row["SYNONYMS"], list) and len(row["SYNONYMS"])
            ):
                synonyms = row["SYNONYMS"].split(", ")
            target = str(row["TARGET"])
            if row["TARGET_PATHWAY"] != "Other":
                target += " in {pathway} pathway".format(
                    pathway=row["TARGET_PATHWAY"].replace("Other, ", "")
                )
            self.data[DrugName(row["DRUG_NAME"], synonyms)] = target

    def retrieve(self, query: str) -> str:
        """
        Retrieves the targets of the compounds in the GDSC database.
        Input:
            query: a drug to query in the knowledge base.
        Returns:
            A string of the targets of the drug.
        """
        return self.data.get(DrugName(query), "No information found.")

    @classmethod
    def knowledge_description(
        cls, *args: Any, **kwargs: Dict[str, Any]
    ) -> str:
        """
        Returns a description of the knowledge.
        Input:
            None.
        Returns:
            The description of the knowledge base.
        """
        del args, kwargs
        return "Retrieves the targets of a drug."

    @classmethod
    def query_description(cls) -> str:
        """
        Returns a description of the expected query type.
        Input:
            None.
        Returns:
            The description of the expected query type.
        """
        return "The drug to retrieve information about."
