import re


def postprocess_answer_chartqa(raw_answer: str) -> str:
    """
    Postprocess the raw output string from the model following these steps:
    1 Extract content after "Answer:"
    2 Normalize text: lowercase, remove punctuation, trim spaces
    3 Convert number words to digits
    4 Expand contractions (e.g. dont → don't)
    5 Remove articles/stopwords
    6 Check for yes/no (high priority)
    7 Check for digits (counting)
    8 Check for known colors
    9 Check for known directions
    10 Return final cleaned result
    """
    # Step 1: Extract "Answer:" content
    answer = raw_answer.split("assistant\n")[-1].strip()

    # Step 2: Normalize text: keep only a-z, 0-9, apostrophe
    answer = answer.lower()  # Take first sentence and lowercase
    answer = re.sub(r'[^a-z0-9\.\']', ' ', answer)
    answer = ' '.join(answer.split()).strip()  # Normalize whitespace

    # Step 3: Convert number words to digits    
    number_words = {
        'zero': '0', 'one': '1', 'two': '2', 'three': '3', 'four': '4',
        'five': '5', 'six': '6', 'seven': '7', 'eight': '8', 'nine': '9',
        'ten': '10', 'eleven': '11', 'twelve': '12', 'thirteen': '13',
        'fourteen': '14', 'fifteen': '15', 'sixteen': '16', 'seventeen': '17',
        'eighteen': '18', 'nineteen': '19', 'twenty': '20', 'thirty': '30',
        'forty': '40', 'fifty': '50', 'sixty': '60', 'seventy': '70',
        'eighty': '80', 'ninety': '90', 'hundred': '100', 'thousand': '1000'
    }
    words = answer.split()
    answer = ' '.join([number_words.get(w, w) for w in words])

    # Step 4: Expand contractions
    contractions = {
        'dont': "don't", 'cant': "can't", 'wont': "won't", 'im': "i'm",
        'youre': "you're", 'theyre': "they're", 'hes': "he's", 'shes': "she's",
        'its': "it's", 'arent': "aren't", 'isnt': "isn't", 'wasnt': "wasn't",
        'werent': "weren't", 'doesnt': "doesn't", 'didnt': "didn't",
        'havent': "haven't", 'hasnt': "hasn't", 'hadnt': "hadn't",
        'wouldnt': "wouldn't", 'couldnt': "couldn't", 'shouldnt': "shouldn't",
        'ive': "i've", 'youve': "you've", 'theyve': "they've", 'weve': "we've",
        'theyd': "they'd", 'youd': "you'd", 'hed': "he'd", 'shed': "she'd",
        'id': "i'd", 'whos': "who's", 'whats': "what's", 'wheres': "where's",
        'whens': "when's", 'whys': "why's", 'hows': "how's"
    }
    for wrong, right in contractions.items():
        answer = re.sub(r'\b' + re.escape(wrong) + r'\b', right, answer)

    # Step 5: Remove articles and stopwords
    answer = re.sub(r'\b(a|an|the|on|in|at|of|for|are)\b', '', answer)
    answer = ' '.join(answer.split())

    # Step 6: Match yes/no
    match = re.search(r'\b(yes|no)\b', answer)
    if match:
        return match.group(1)

    # Step 7.1: Match time
    time = re.findall(r'\b\d+(?::\d+)\b', answer)
    if time:
        return time[0]

    # Step 7: Match digits
    numbers = re.findall(r'\b\d+(?:\.\d+)?\b', answer)
    if numbers:
        return numbers[0]

    # Step 8: Match color keywords
    color_keywords = {
        'red', 'blue', 'green', 'yellow', 'black', 'white', 'orange', 'purple',
        'pink', 'brown', 'gray', 'grey', 'silver', 'gold', 'beige', 'cyan',
        'maroon', 'olive', 'navy', 'lime', 'teal', 'turquoise', 'indigo'
    }
    color_pattern = r'\b(' + '|'.join(color_keywords) + r')\b(?:\s+and\s+\b(' + '|'.join(color_keywords) + r')\b)*'
    color_matches = re.findall(color_pattern, answer)
    if color_matches:
        flat = []
        for group in color_matches:
            flat.extend([g for g in group if g])
        return ' '.join(flat).strip()

    # Step 9: Match known directions
    direction_set = {
        'left', 'right', 'top', 'bottom', 'upper', 'lower', 'front', 'back',
        'middle', 'center', 'top-left', 'top-right', 'bottom-left', 'bottom-right'
    }
    direction_pattern = r'\b(' + '|'.join(direction_set) + r')\b(?:\s+and\s+\b(' + '|'.join(direction_set) + r')\b)*'
    direction_matches = re.findall(direction_pattern, answer)
    if direction_matches:
        flat = []
        for group in direction_matches:
            flat.extend([g for g in group if g])
        return ' '.join(flat).strip()

    # Step 10: Return final cleaned result
    return answer