#!/usr/bin/env python3
"""
Symbol Language Translator: translate geometric symbol language into natural language

Template-based translator, used between seed problem generation and instantiation
to translate the symbol language into natural language and remove unnecessary noise.
Supports translating all parts including problem, proof and original_constructions.
"""

import re
from typing import List, Dict, Tuple, Optional


class SymbolTranslator:
    """Translator from geometric symbol language to natural language"""
    
    def __init__(self):
        """Initialize the translator and define predicate and construction templates"""
        def _format_angle_value(value: str) -> str:
            """
            Format angle values, supporting degree notation ending with 'o'
            and pi-notation such as 1pi/2.
            """
            if not value:
                return value
            
            # handle degree notation ending with "o"
            if value.lower().endswith("o"):
                return value[:-1] + "°"
            
            # handle pi format such as "1pi/2", "pi/2", "2pi/3"
            import re
            import math
            
            # match pattern: optional number + pi + / + number
            # e.g. "1pi/2", "pi/2", "2pi/3", "3pi/4"
            pi_pattern = r'^(\d*)pi/(\d+)$'
            match = re.match(pi_pattern, value.lower())
            if match:
                numerator_str = match.group(1)
                denominator = int(match.group(2))
                
                # if numerator is empty, default to 1
                numerator = int(numerator_str) if numerator_str else 1
                
                # convert to degrees
                radians = (numerator * math.pi) / denominator
                degrees = math.degrees(radians)
                
                # use simplified representation for common angles
                if abs(degrees - 90) < 0.01:
                    return "90°"
                elif abs(degrees - 60) < 0.01:
                    return "60°"
                elif abs(degrees - 45) < 0.01:
                    return "45°"
                elif abs(degrees - 30) < 0.01:
                    return "30°"
                elif abs(degrees - 120) < 0.01:
                    return "120°"
                elif abs(degrees - 135) < 0.01:
                    return "135°"
                elif abs(degrees - 150) < 0.01:
                    return "150°"
                elif abs(degrees - 180) < 0.01:
                    return "180°"
                else:
                    # if not common angles, convert to degrees (integer or one decimal)
                    if abs(degrees - round(degrees)) < 0.01:
                        return f"{int(round(degrees))}°"
                    else:
                        return f"{degrees:.1f}°"
            
            return value
        
        # Chinese translation templates for geometric predicates
        self.predicate_templates = {
            # basic relations
            'coll': lambda args: f"Points {args[0].upper()}, {args[1].upper()}, {args[2].upper()} are collinear",
            'cong': lambda args: f"{args[0].upper()}{args[1].upper()} = {args[2].upper()}{args[3].upper()}",
            'para': lambda args: f"{args[0].upper()}{args[1].upper()} ∥ {args[2].upper()}{args[3].upper()}",
            'perp': lambda args: f"{args[0].upper()}{args[1].upper()} ⊥ {args[2].upper()}{args[3].upper()}",
            
            # special points
            'midp': lambda args: f"Point {args[2].upper()} is the midpoint of {args[0].upper()}{args[1].upper()}",
            
            # angle and ratio
            'eqangle': lambda args: (
                # 6 parameters: ∠ABC = ∠DEF
                f"∠{args[0].upper()}{args[1].upper()}{args[2].upper()} equals ∠{args[3].upper()}{args[4].upper()}{args[5].upper()}"
                if len(args) == 6
                # 8 parameters: angle(AB, CD) = angle(EF, GH)
                else f"∠({args[0].upper()}{args[1].upper()}, {args[2].upper()}{args[3].upper()}) equals ∠({args[4].upper()}{args[5].upper()}, {args[6].upper()}{args[7].upper()})"
                if len(args) == 8
                else f"∠{args[0].upper()}{args[1].upper()}{args[2].upper()} equals ∠{args[3].upper()}{args[4].upper()}{args[5].upper()}"
            ),
            'eqratio': lambda args: (
                f"{args[0].upper()}{args[1].upper()}:{args[2].upper()}{args[3].upper()} = {args[4].upper()}{args[5].upper()}:{args[6].upper()}{args[7].upper()}"
                if len(args) >= 8
                else f"{args[0].upper()}{args[1].upper()}:{args[2].upper()}{args[3].upper()} = {args[4]}"
                if len(args) == 5
                else f"{args[0].upper()}{args[1].upper()}:{args[2].upper()}{args[3].upper()} = {args[4].upper()}{args[5].upper()}:{args[6].upper()}{args[7].upper()}"
            ),
            
            # circle
            'cyclic': lambda args: f"Points {args[0].upper()}, {args[1].upper()}, {args[2].upper()}, {args[3].upper()} are concyclic",
            
            # triangle relations
            'simtri': lambda args: f"△{args[0].upper()}{args[1].upper()}{args[2].upper()} is similar to △{args[3].upper()}{args[4].upper()}{args[5].upper()}",
            'simtrir': lambda args: f"△{args[0].upper()}{args[1].upper()}{args[2].upper()} is similar to △{args[3].upper()}{args[4].upper()}{args[5].upper()}",
            'contri': lambda args: f"△{args[0].upper()}{args[1].upper()}{args[2].upper()} is congruent to △{args[3].upper()}{args[4].upper()}{args[5].upper()}",
            'contrir': lambda args: f"△{args[0].upper()}{args[1].upper()}{args[2].upper()} is congruent to △{args[3].upper()}{args[4].upper()}{args[5].upper()}",
            
            # constant relations
            'rconst': lambda args: f"{args[0].upper()}{args[1].upper()}:{args[2].upper()}{args[3].upper()} = {args[4]}",
            'rconst2': lambda args: f"{args[0].upper()}{args[1].upper()}:{args[2].upper()}{args[3].upper()} = {args[4]}",
            'lconst': lambda args: f"{args[0].upper()}{args[1].upper()} = {args[2]}",
            'aconst': lambda args, fmt=_format_angle_value: (
                f"∠{args[0].upper()}{args[1].upper()}{args[2].upper()} equals {fmt(args[3])}"
                if len(args) == 4
                else f"∠({args[0].upper()}{args[1].upper()}, {args[2].upper()}{args[3].upper()}) equals {fmt(args[4])}"
                if len(args) == 5
                else f"∠{args[0].upper()}{args[1].upper()}{args[2].upper()} equals {fmt(args[3])}"
            ),
            
            # computed relations (usually can be omitted as they are derived results)
            'rcompute': lambda args: f"{args[0].upper()}{args[1].upper()}:{args[2].upper()}{args[3].upper()} = {args[4]}",
            'acompute': lambda args, fmt=_format_angle_value: f"∠{args[0].upper()}{args[1].upper()}{args[2].upper()} equals {fmt(args[3])}",
            'lcompute': lambda args: f"{args[0].upper()}{args[1].upper()} = {args[2]}",
            
            # numerical checks (usually can be omitted or simplified)
            'sameclock': lambda args: f"Triangles {args[0].upper()}{args[1].upper()}{args[2].upper()} and {args[3].upper()}{args[4].upper()}{args[5].upper()} have the same orientation",
            'sameside': lambda args: f"Points {args[0].upper()} and {args[1].upper()} lie on the same side of line {args[2].upper()}{args[3].upper()}",
            'diff': lambda args: f"Points {args[0].upper()} and {args[1].upper()} are distinct",
            
            # other possible predicates
            'ncoll': lambda args: f"Points {args[0].upper()}, {args[1].upper()}, {args[2].upper()} are not collinear",
            'npara': lambda args: f"{args[0].upper()}{args[1].upper()} is not parallel to {args[2].upper()}{args[3].upper()}",
            'nperp': lambda args: f"{args[0].upper()}{args[1].upper()} is not perpendicular to {args[2].upper()}{args[3].upper()}",
            'nsameside': lambda args: f"Points {args[0].upper()} and {args[1].upper()} lie on opposite sides of line {args[2].upper()}{args[3].upper()}",
            
            # additional predicates (may appear in proof or numerical_check)
            'circle': lambda args: (
                f"Circle with center {args[0].upper()} passing through {args[1].upper()}"
                if len(args) == 2
                else f"Circle with center {args[0].upper()} passing through {args[1].upper()} and {args[2].upper()}"
                if len(args) == 3
                else f"Circle with center {args[0].upper()} passing through {args[1].upper()}, {args[2].upper()} and {args[3].upper()}"
            ),
        }
        
        # Chinese translation templates for constructions
        self.construction_templates = {
            # basic figures
            'triangle': lambda args: f"△{args[0].upper()}{args[1].upper()}{args[2].upper()}",
            'r_triangle': lambda args: f"Right triangle △{args[0].upper()}{args[1].upper()}{args[2].upper()}",
            'iso_triangle': lambda args: f"Isosceles triangle △{args[0].upper()}{args[1].upper()}{args[2].upper()}",
            'eq_triangle': lambda args: f"Equilateral triangle △{args[0].upper()}{args[1].upper()}{args[2].upper()}",
            'quadrangle': lambda args: f"Quadrilateral {args[0].upper()}{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            'rectangle': lambda args: f"Rectangle {args[0].upper()}{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            'square': lambda args: f"Square {args[0].upper()}{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            'trapezoid': lambda args: f"Trapezoid {args[0].upper()}{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            'r_trapezoid': lambda args: f"Right trapezoid {args[0].upper()}{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            'iso_trapezoid': lambda args: f"Isosceles trapezoid {args[0].upper()}{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            'eq_quadrangle': lambda args: f"Equilateral quadrilateral {args[0].upper()}{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            'eqdia_quadrangle': lambda args: f"Quadrilateral with equal diagonals {args[0].upper()}{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            'parallelogram': lambda args: f"Parallelogram {args[0].upper()}{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            
            # point constructions
            'free': lambda args: f"Free point {args[0].upper()}",
            'on_line': lambda args: f"Point {args[0].upper()} lies on line {args[1].upper()}{args[2].upper()}",
            'on_circle': lambda args: f"Point {args[0].upper()} lies on the circle with center {args[1].upper()} passing through {args[2].upper()}",
            'on_circum': lambda args: f"Point {args[0].upper()} lies on the circumcircle through {args[1].upper()}, {args[2].upper()}, {args[3].upper()}",
            'midpoint': lambda args: f"Point {args[0].upper()} is the midpoint of {args[1].upper()}{args[2].upper()}",
            
            # special points (based on defs.txt)
            # circumcenter x a b c: x is the circumcenter of △abc (cong x a x b, cong x b x c)
            'circumcenter': lambda args: f"Point {args[0].upper()} is the circumcenter of △{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            # incenter x a b c: x is the incenter of △abc
            # eqangle a b a i a i a c, eqangle c a c i c i c b (intersection of two angle bisectors)
            'incenter': lambda args: f"Point {args[0].upper()} is the incenter of △{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            # incenter2 x y z i a b c: i is the incenter, x,y,z are feet of perpendiculars
            'incenter2': lambda args: (
                f"Point {args[3].upper()} is the incenter of △{args[4].upper()}{args[5].upper()}{args[6].upper()}, and {args[0].upper()}, {args[1].upper()}, {args[2].upper()} are the feet of its perpendiculars to the sides"
                if len(args) == 7
                else f"Point {args[0].upper()} is the incenter and related points"
            ),
            # excenter x a b c: x is an excenter of △abc
            'excenter': lambda args: f"Point {args[0].upper()} is an excenter of △{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            # excenter2 x y z i a b c: i is the excenter, x,y,z are feet of perpendiculars
            'excenter2': lambda args: (
                f"Point {args[3].upper()} is an excenter of △{args[4].upper()}{args[5].upper()}{args[6].upper()}, and {args[0].upper()}, {args[1].upper()}, {args[2].upper()} are the feet of its perpendiculars to the sides"
                if len(args) == 7
                else f"Point {args[0].upper()} is an excenter and related points"
            ),
            # orthocenter x a b c: x is the orthocenter of △abc (perp x a b c, perp x b c a)
            'orthocenter': lambda args: f"Point {args[0].upper()} is the orthocenter of △{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            # centroid x y z i a b c: i is the centroid, x,y,z are midpoints
            'centroid': lambda args: (
                f"Point {args[3].upper()} is the centroid of △{args[4].upper()}{args[5].upper()}{args[6].upper()}, and {args[0].upper()}, {args[1].upper()}, {args[2].upper()} are the midpoints of the sides"
                if len(args) == 7
                else f"Point {args[0].upper()} is the centroid"
            ),
            # ninepoints x y z i a b c: x,y,z are midpoints, i is nine-point center
            'ninepoints': lambda args: (
                f"Points {args[0].upper()}, {args[1].upper()}, {args[2].upper()} are the midpoints of the sides of △{args[4].upper()}{args[5].upper()}{args[6].upper()}, and point {args[3].upper()} is the center of the nine-point circle"
                if len(args) == 7
                else f"Points related to the nine-point circle"
            ),
            
            # other constructions
            # circle x a b c: x is circumcenter of △abc (cong x a x b, cong x b x c)
            'circle': lambda args: (
                f"Point {args[0].upper()} is the circumcenter of △{args[1].upper()}{args[2].upper()}{args[3].upper()}"
                if len(args) == 4
                else f"Circle related point"
            ),
            # foot x a b c: x is the foot from A to line BC (perp x a b c, coll x b c)
            'foot': lambda args: f"Point {args[0].upper()} is the foot from {args[1].upper()} to line {args[2].upper()}{args[3].upper()}",
            'mirror': lambda args: f"Point {args[0].upper()} is the reflection of {args[1].upper()} about point {args[2].upper()}",
            'angle_bisector': lambda args: f"The angle bisector of ∠{args[1].upper()}{args[2].upper()}{args[3].upper()} passes through point {args[0].upper()}",
            'angle_mirror': lambda args: f"Point {args[0].upper()} is the reflection of {args[1].upper()} about the angle bisector of ∠{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            
            # complex constructions (line constructions related to angles and directions)
            # on_aline x a b c d e: x such that ∠axab = ∠dcde (eqangle a x a b d c d e)
            'on_aline': lambda args: f"Point {args[0].upper()} satisfies ∠{args[2].upper()}{args[1].upper()}{args[0].upper()} = ∠{args[5].upper()}{args[4].upper()}{args[3].upper()}",
            # on_aline0 x a b c d e f g: x such that ∠abcd = ∠efgx (eqangle a b c d e f g x)
            'on_aline0': lambda args: f"Point {args[0].upper()} satisfies ∠({args[1].upper()}{args[2].upper()}, {args[3].upper()}{args[4].upper()}) = ∠({args[5].upper()}{args[6].upper()}, {args[7].upper()}{args[0].upper()})",
            # on_aline2: incomplete construction in AlphaGeometry, list parameters directly
            'on_aline2': lambda args: f"on_aline2 construction with parameters: {', '.join([a.upper() for a in args])}",
            # on_bline x a b: x on perpendicular bisector of AB (cong x a x b, eqangle a x a b b a b x)
            'on_bline': lambda args: f"Point {args[0].upper()} lies on the perpendicular bisector of segment {args[1].upper()}{args[2].upper()}",
            # on_tline x a b c: x on line through A perpendicular to BC (perp x a b c)
            'on_tline': lambda args: f"Point {args[0].upper()} lies on the line through {args[1].upper()} perpendicular to {args[2].upper()}{args[3].upper()}",
            # on_dia x a b: x on circle with diameter AB (perp x a x b)
            'on_dia': lambda args: f"Point {args[0].upper()} lies on the circle with diameter {args[1].upper()}{args[2].upper()}",
            # on_pline x a b c: x on line through A parallel to BC (para x a b c)
            'on_pline': lambda args: f"Point {args[0].upper()} lies on the line through {args[1].upper()} parallel to {args[2].upper()}{args[3].upper()}",
            # on_pline0 x a b c: same as on_pline (para x a b c)
            'on_pline0': lambda args: f"Point {args[0].upper()} lies on the line through {args[1].upper()} parallel to {args[2].upper()}{args[3].upper()}",
            # on_opline: possibly "opposite parallel line" (not clearly defined, conservative wording)
            'on_opline': lambda args: (
                f"Point {args[0].upper()} lies on an opposite parallel line"
                if len(args) <= 3
                else f"Point {args[0].upper()} lies on a line satisfying a specific parallel relation"
            ),
            
            # intersection constructions
            'intersection_ll': lambda args: (
                f"Point {args[0].upper()} is the intersection of lines {args[1].upper()}{args[2].upper()} and {args[3].upper()}{args[4].upper()}"
                if len(args) == 5
                else f"Point {args[0].upper()} is the intersection of lines {args[1].upper()}{args[2].upper()} and {args[3].upper()}{args[4].upper()}"
            ),
            'intersection_lc': lambda args: f"Point {args[0].upper()} is the intersection of line {args[1].upper()}{args[2].upper()} and the circle with center {args[3].upper()} passing through {args[4].upper()}",
            'intersection_cc': lambda args: (
                f"Point {args[0].upper()} is the intersection of the circle with center {args[1].upper()} passing through {args[3].upper()} and the circle with center {args[2].upper()} passing through {args[3].upper()}"
                if len(args) == 4
                else f"Point {args[0].upper()} is the intersection of the circle with center {args[1].upper()} passing through {args[2].upper()} and the circle with center {args[3].upper()} passing through {args[4].upper()}"
            ),
            'intersection_lp': lambda args: f"Point {args[0].upper()} is the intersection of line {args[1].upper()}{args[2].upper()} and the line through {args[3].upper()} parallel to {args[4].upper()}{args[5].upper()}",
            'intersection_lt': lambda args: f"Point {args[0].upper()} is the intersection of line {args[1].upper()}{args[2].upper()} and the line through {args[3].upper()} perpendicular to {args[4].upper()}{args[5].upper()}",
            'intersection_pp': lambda args: f"Point {args[0].upper()} is the intersection of the line through {args[1].upper()} parallel to {args[2].upper()}{args[3].upper()} and the line through {args[4].upper()} parallel to {args[5].upper()}{args[6].upper()}",
            'intersection_tt': lambda args: f"Point {args[0].upper()} is the intersection of the line through {args[1].upper()} perpendicular to {args[2].upper()}{args[3].upper()} and the line through {args[4].upper()} perpendicular to {args[5].upper()}{args[6].upper()}",
            
            # tangent constructions (based on defs.txt)
            # lc_tangent x a o: x lies on line through A perpendicular to AO (perp a x a o)
            'lc_tangent': lambda args: f"Point {args[0].upper()} lies on the line through {args[1].upper()} perpendicular to {args[1].upper()}{args[2].upper()} (tangent construction)",
            # cc_tangent x y z i o a w b: four points on common tangents of two circles
            # x y: cong o x o a, cong w y w b, perp x o x y, perp y w y x
            # z i: cong o z o a, cong w i w b, perp z o z i, perp i w i z
            'cc_tangent': lambda args: (
                f"Points {args[0].upper()}, {args[1].upper()}, {args[2].upper()}, {args[3].upper()} lie on the common tangents of the circle with center {args[4].upper()} passing through {args[5].upper()} and the circle with center {args[6].upper()} passing through {args[7].upper()}"
                if len(args) == 8
                else f"Points {', '.join([a.upper() for a in args[:4]])} lie on the common tangents of two circles"
            ),
            # tangent x y a o b: x,y lie on the tangent through A to the circle with center O passing through B
            # x: cong o x o b, perp a x o x; y: cong o y o b, perp a y o y
            'tangent': lambda args: (
                f"Points {args[0].upper()} and {args[1].upper()} lie on the tangent through {args[2].upper()} to the circle with center {args[3].upper()} passing through {args[4].upper()}"
                if len(args) == 5
                else f"Points {args[0].upper()} and {args[1].upper()} lie on a tangent line"
            ),
            
            # equal distance constructions (based on defs.txt)
            # eqdistance x a b c: x lies on circle centered at A with radius BC (cong x a b c)
            'eqdistance': lambda args: f"Point {args[0].upper()} satisfies {args[0].upper()}{args[1].upper()} = {args[2].upper()}{args[3].upper()}",
            
            # square-related constructions (based on defs.txt)
            # nsquare x a b: △xab is an isosceles right triangle (negative 90-degree rotation)
            # cong x a a b, perp x a a b (rotaten90 a b)
            'nsquare': lambda args: f"Point {args[0].upper()} makes △{args[0].upper()}{args[1].upper()}{args[2].upper()} an isosceles right triangle ({args[0].upper()}{args[1].upper()} = {args[1].upper()}{args[2].upper()} and {args[0].upper()}{args[1].upper()} ⊥ {args[1].upper()}{args[2].upper()})",
            # psquare x a b: △xab is an isosceles right triangle (positive 90-degree rotation)
            # cong x a a b, perp x a a b (rotatep90 a b)
            'psquare': lambda args: f"Point {args[0].upper()} makes △{args[0].upper()}{args[1].upper()}{args[2].upper()} an isosceles right triangle ({args[0].upper()}{args[1].upper()} = {args[1].upper()}{args[2].upper()} and {args[0].upper()}{args[1].upper()} ⊥ {args[1].upper()}{args[2].upper()})",
            # isquare a b c d: square abcd
            'isquare': lambda args: f"Square {args[0].upper()}{args[1].upper()}{args[2].upper()}{args[3].upper()}",
            
            # angle constructions (based on defs.txt)
            # s_angle x a b y: x such that ∠abx = y° (aconst a b b x y)
            's_angle': lambda args, fmt=_format_angle_value: f"Point {args[0].upper()} satisfies ∠{args[1].upper()}{args[2].upper()}{args[0].upper()} equals {fmt(args[3])}",
            # eqangle2 x a b c: x such that ∠abax = ∠cxcb (eqangle a b a x c x c b)
            'eqangle2': lambda args: f"Point {args[0].upper()} satisfies ∠{args[2].upper()}{args[1].upper()}{args[0].upper()} equals ∠{args[0].upper()}{args[3].upper()}{args[2].upper()}",
            # eqangle3 x a b d e f: x such that ∠xaxb = ∠dedf (eqangle x a x b d e d f)
            'eqangle3': lambda args: f"Point {args[0].upper()} satisfies ∠{args[1].upper()}{args[0].upper()}{args[2].upper()} equals ∠{args[4].upper()}{args[3].upper()}{args[5].upper()}",
            
            # ratio constructions (based on defs.txt)
            # eqratio x a b c d e f g: x such that AB:CD = EF:GX (eqratio a b c d e f g x)
            'eqratio': lambda args: (
                f"Point {args[0].upper()} satisfies {args[1].upper()}{args[2].upper()}:{args[3].upper()}{args[4].upper()} = {args[5].upper()}{args[6].upper()}:{args[7].upper()}{args[0].upper()}"
                if len(args) == 8
                else f"Point {args[0].upper()} satisfies a ratio relation"
            ),
            # eqratio6 x a c e f g h: x such that AX:CX = EF:GH (eqratio a x c x e f g h)
            'eqratio6': lambda args: (
                f"Point {args[0].upper()} satisfies {args[1].upper()}{args[0].upper()}:{args[2].upper()}{args[0].upper()} = {args[3].upper()}{args[4].upper()}:{args[5].upper()}{args[6].upper()}"
                if len(args) == 7
                else f"Point {args[0].upper()} satisfies a ratio relation"
            ),
            
            # triangle constructions (based on defs.txt)
            # triangle12 a b c: triangle with AB:AC = 1:2 (rconst a b a c 1/2)
            'triangle12': lambda args: f"△{args[0].upper()}{args[1].upper()}{args[2].upper()}, with {args[0].upper()}{args[1].upper()}:{args[0].upper()}{args[2].upper()} = 1:2",
            # ieq_triangle a b c: equilateral triangle (cong a b b c, cong b c c a)
            'ieq_triangle': lambda args: f"Equilateral triangle △{args[0].upper()}{args[1].upper()}{args[2].upper()}",
            # risos a b c: isosceles right triangle (perp a b a c, cong a b a c)
            'risos': lambda args: f"Isosceles right triangle △{args[0].upper()}{args[1].upper()}{args[2].upper()} ({args[0].upper()}{args[1].upper()} ⊥ {args[0].upper()}{args[2].upper()} and {args[0].upper()}{args[1].upper()} = {args[0].upper()}{args[2].upper()})",
            # iso_triangle0 a b c: isosceles triangle (cong a b a c)
            'iso_triangle0': lambda args: f"Isosceles triangle △{args[0].upper()}{args[1].upper()}{args[2].upper()} ({args[0].upper()}{args[1].upper()} = {args[0].upper()}{args[2].upper()})",
            
            # partition constructions (based on defs.txt)
            # trisect x y a b c: x,y on AC, trisect ∠abc
            # coll x a c, coll y a c, eqangle b a b x b x b y, eqangle b x b y b y b c
            'trisect': lambda args: (
                f"Points {args[0].upper()} and {args[1].upper()} lie on segment {args[2].upper()}{args[4].upper()} and trisect ∠{args[2].upper()}{args[3].upper()}{args[4].upper()}"
                if len(args) == 5
                else f"Points {args[0].upper()} and {args[1].upper()} trisect an angle"
            ),
            # trisegment x y a b: x,y on AB, trisect AB
            # coll x a b, coll y a b, cong x a x y, cong y x y b
            'trisegment': lambda args: (
                f"Points {args[0].upper()} and {args[1].upper()} lie on segment {args[2].upper()}{args[3].upper()} and trisect it"
                if len(args) == 4
                else f"Points {args[0].upper()} and {args[1].upper()} trisect a segment"
            ),
            
            # other special constructions (based on defs.txt)
            'pentagon': lambda args: f"Pentagon {args[0].upper()}{args[1].upper()}{args[2].upper()}{args[3].upper()}{args[4].upper()}",
            'segment': lambda args: f"Segment {args[0].upper()}{args[1].upper()}",
            # shift x b c d: x is translation of B by vector DC (cong x b c d, cong x c b d)
            'shift': lambda args: (
                f"Point {args[0].upper()} is obtained by translating point {args[1].upper()} by vector {args[3].upper()}{args[2].upper()}"
                if len(args) == 4
                else f"Point {args[0].upper()} is obtained by translating point {args[1].upper()}"
            ),
            # reflect x a b c: x is reflection of A about line BC (cong b a b x, cong c a c x)
            'reflect': lambda args: (
                f"Point {args[0].upper()} is the reflection of {args[1].upper()} about line {args[2].upper()}{args[3].upper()}"
                if len(args) == 4
                else f"Point {args[0].upper()} is a reflection point"
            ),
            # 3peq x y z a b c: x,y on sides of △abc, z on bc, such that zx=zy
            # z: coll z b c; x y: coll x a b, coll y a c, coll x y z, cong z x z y
            '3peq': lambda args: (
                f"Point {args[2].upper()} lies on side {args[4].upper()}{args[5].upper()}, point {args[0].upper()} lies on side {args[3].upper()}{args[4].upper()}, point {args[1].upper()} lies on side {args[3].upper()}{args[5].upper()}, and {args[2].upper()}{args[0].upper()} = {args[2].upper()}{args[1].upper()}"
                if len(args) == 6
                else f"Points {args[0].upper()}, {args[1].upper()}, {args[2].upper()} satisfy an equal-distance relation"
            ),
        }
    
    def is_predicate_supported(self, predicate: str) -> bool:
        """
        Check whether a predicate is supported for translation.
        
        Args:
            predicate: predicate name
        
        Returns:
            True if the predicate is supported, False otherwise
        """
        return predicate in self.predicate_templates
    
    def translate_predicate(self, predicate: str, args: List[str]) -> Optional[str]:
        """
        Translate a single predicate.
        
        Args:
            predicate: predicate name
            args: list of arguments
        
        Returns:
            Natural language translation, or None if translation fails
        """
        if predicate not in self.predicate_templates:
            # if the predicate is not in templates, fall back to raw format
            return f"{predicate}({', '.join(args)})"
        
        try:
            template_func = self.predicate_templates[predicate]
            return template_func(args)
        except (IndexError, Exception):
            return f"{predicate}({', '.join(args)})"
    
    def is_construction_supported(self, construct_type: str) -> bool:
        """
        Check whether a construction type is supported for translation.
        
        Args:
            construct_type: construction type name
        
        Returns:
            True if the construction type is supported, False otherwise
        """
        return construct_type in self.construction_templates
    
    def translate_construction(self, construct_type: str, args: List[str]) -> str:
        """
        Translate a single construction.
        
        Args:
            construct_type: construction type
            args: list of arguments
        
        Returns:
            Natural language translation.
        """
        if construct_type not in self.construction_templates:
            # if the construction type is not in templates, return a simplified description
            result = f"{construct_type}({', '.join(args)})"
        else:
            try:
                template_func = self.construction_templates[construct_type]
                result = template_func(args)
            except (IndexError, Exception):
                result = f"{construct_type}({', '.join(args)})"
        
        return result
    
    def parse_problem(self, problem_text: str) -> Tuple[List[str], List[Tuple[str, List[str], str]], Optional[str]]:
        """
        Parse the problem text and extract points, premises and goal.
        
        Args:
            problem_text: e.g. "a : ; b : ; c : ; d : coll b c d [000] cong b d c d [001] ? simtri a b c e d c"
        
        Returns:
            (points, premises, goal) where:
            - points: list of points
            - premises: [(predicate, args, id), ...]
            - goal: goal predicate and arguments (if any)
        """
        points = []
        premises = []
        goal = None
        
        # split premises and goal by '?'
        if "?" in problem_text:
            parts = problem_text.split("?", 1)
            premises_part = parts[0].strip()
            goal_part = parts[1].strip()
        else:
            premises_part = problem_text.strip()
            goal_part = None
        
        # extract point definitions like "a : ; b : ; c :", filter out helper points x00, x01, ...
        point_pattern = r'(\w+)\s*:'
        for match in re.finditer(point_pattern, premises_part):
            point_name = match.group(1)
            # filter out names like x00, x01, ...
            if not re.match(r'^x\d+$', point_name, re.IGNORECASE):
                if point_name not in points:
                    points.append(point_name)
        
        # extract premises: "predicate arg1 arg2 ... [id]", filter helper points x00, ...
        premise_pattern = r'(\w+)\s+([a-z0-9\s/]+?)\s+\[(\d+)\]'
        for match in re.finditer(premise_pattern, premises_part):
            pred_name = match.group(1)
            args_str = match.group(2).strip()
            pred_id = match.group(3)
            # filter out helper points x00, x01, ...
            args = [
                a.strip() for a in args_str.split() 
                if a.strip() and not re.match(r'^x\d+$', a.strip(), re.IGNORECASE)
            ]
            if args:  # only keep predicates with valid arguments
                premises.append((pred_name, args, pred_id))
        
        # extract goal: "predicate arg1 arg2 ...", filter helper points x00, x01, ...
        if goal_part:
            goal_match = re.match(r'(\w+)\s+(.+)', goal_part.strip())
            if goal_match:
                pred_name = goal_match.group(1)
                args_str = goal_match.group(2).strip()
                # Filter out meaningless helper points like x00, x01, ...
                args = [
                    a.strip() for a in args_str.split() 
                    if a.strip() and not re.match(r'^x\d+$', a.strip(), re.IGNORECASE)
                ]
                if args:  # Only add goals with valid arguments
                    goal = (pred_name, args)
        
        return points, premises, goal
    
    def parse_proof(self, proof_text: str) -> List[Tuple[str, List[str], str, Optional[str]]]:
        """
        Parse proof text and extract proof steps.
        
        Args:
            proof_text: e.g. "para a f b f [009] r82 [004] ; eqangle a b b c b f b d [010] AR [004] [000] [009] ; ..."
        
        Returns:
            List of tuples (predicate, args, step_id, rule)
        """
        steps = []
        # split steps by semicolon
        # pattern: predicate args [id] rule_refs
        step_pattern = r'(\w+)\s+([a-z0-9\s/]+?)\s+\[(\d+)\]\s+([^;]*?)(?=\s*;|$)'
        for match in re.finditer(step_pattern, proof_text):
            pred_name = match.group(1)
            args_str = match.group(2).strip()
            step_id = match.group(3)
            rule_part = match.group(4).strip()
            args = [a.strip() for a in args_str.split() if a.strip()]
            # extract rule (usually rXX or AR)
            rule_match = re.search(r'([r]\d+|AR)', rule_part)
            rule = rule_match.group(1) if rule_match else None
            steps.append((pred_name, args, step_id, rule))
        return steps
    
    def parse_constructions(self, constructions_text: str) -> List[Tuple[List[str], str, List[str], int]]:
        """
        Parse the original_constructions text.
        
        Args:
            constructions_text: e.g. "a b c : r_triangle a b c; d : free d; e : on_line e a b; ..."
        
        Returns:
            [(points, construct_type, args, clause_index), ...]
        """
        constructions = []
        # split constructions by semicolon
        clauses = constructions_text.split(';')
        clause_index = 0
        for clause in clauses:
            clause = clause.strip()
            if not clause:
                continue
            # split points and construction: "points : construct_type args" or "point : construct_type args"
            if ':' in clause:
                clause_index += 1
                parts = clause.split(':', 1)
                points_str = parts[0].strip()
                construct_part = parts[1].strip()
                points = [p.strip() for p in points_str.split() if p.strip()]
                # support multiple constructions separated by commas
                construct_segments = [seg.strip() for seg in construct_part.split(',') if seg.strip()]
                for segment in construct_segments:
                    construct_match = re.match(r'(\w+)\s+(.+)', segment)
                    if construct_match:
                        construct_type = construct_match.group(1)
                        args_str = construct_match.group(2).strip()
                        args = [
                            token.strip().strip(',;')
                            for token in args_str.split()
                            if token.strip().strip(',;')
                        ]
                        constructions.append((points, construct_type, args, clause_index))
        return constructions
    
    def translate_problem(self, problem_text: str, simplify: bool = True) -> str:
        """
        Translate the whole problem text into natural language.
        
        Args:
            problem_text: problem text in symbol language
            simplify: whether to simplify output (remove redundancy)
        
        Returns:
            Natural language description
        """
        if not problem_text or not problem_text.strip():
            return ""
        
        # parse problem
        points, premises, goal = self.parse_problem(problem_text)
        
        # translate premises
        premise_translations = []
        for pred_name, args, pred_id in premises:
            translation = self.translate_predicate(pred_name, args)
            if translation:
                premise_translations.append(translation)
        
        # translate goal
        goal_translation = None
        if goal:
            pred_name, args = goal
            goal_translation = self.translate_predicate(pred_name, args)
        
        # combine result
        parts = []
        
        # premises
        if premise_translations:
            if simplify:
                # simplify: merge similar predicates and remove redundancy
                premise_translations = self._simplify_premises(premise_translations)
            parts.append("Given: " + "; ".join(premise_translations))
        
        # goal
        if goal_translation:
            parts.append("To prove: " + goal_translation)
        
        result = ". ".join(parts)
        if result and not result.endswith("."):
            result += "."
        
        return result
    
    def translate_proof(self, proof_text: str, simplify: bool = True) -> str:
        """
        Translate proof text into natural language.
        
        Args:
            proof_text: proof in symbol language
            simplify: whether to simplify output (ignore rule references)
        
        Returns:
            Natural language description
        """
        if not proof_text or not proof_text.strip():
            return ""
        
        steps = self.parse_proof(proof_text)
        if not steps:
            return ""
        
        step_translations = []
        for pred_name, args, step_id, rule in steps:
            translation = self.translate_predicate(pred_name, args)
            if translation:
                if simplify:
                    step_translations.append(translation)
                else:
                    step_translations.append(f"{translation} [step {step_id}]")
        
        if simplify:
            # remove duplicate steps
            seen = set()
            unique_steps = []
            for step in step_translations:
                if step not in seen:
                    seen.add(step)
                    unique_steps.append(step)
            step_translations = unique_steps
        
        return "; ".join(step_translations) + "."
    
    def translate_constructions(self, constructions_text: str, simplify: bool = True) -> str:
        """
        Translate original_constructions text into natural language.
        
        Args:
            constructions_text: constructions in symbol language
            simplify: whether to simplify output
        
        Returns:
            Natural language description
        """
        if not constructions_text or not constructions_text.strip():
            return ""
        
        constructions = self.parse_constructions(constructions_text)
        if not constructions:
            return ""
        
        grouped_translations = []
        for points, construct_type, args, clause_idx in constructions:
            translation = self.translate_construction(construct_type, args)
            if not translation:
                continue
            if grouped_translations and grouped_translations[-1]['clause'] == clause_idx:
                grouped_translations[-1]['translations'].append(translation)
            else:
                grouped_translations.append({
                    'clause': clause_idx,
                    'points': points,
                    'translations': [translation],
                })
        
        if not grouped_translations:
            return ""
        
        sentences = []
        for group in grouped_translations:
            items = group['translations']
            if not items:
                continue
            if len(items) == 1:
                sentences.append(items[0])
            else:
                sentences.append("; ".join(items))
        
        return ". ".join(sentences) + "."
    
    def translate_problem_origin(self, problem_origin: str) -> str:
        """
        Directly translate the problem_origin format.
        
        Format: "a : ; b : ; c : coll c a b, cong c a c b"
        - "a :" or "a : ;" means "construct point A"
        - "a : coll a b c" means "construct point A such that coll a b c"
        - "a : coll a b c, cong a b c d" means "construct point A such that coll a b c and cong a b c d"
        
        Args:
            problem_origin: string in problem_origin format
        
        Returns:
            Natural language description
        """
        if not problem_origin or not problem_origin.strip():
            return ""
        
        import re
        sentences: List[str] = []
        
        # split definitions of each point by semicolon
        clauses = re.split(r';\s*', problem_origin.strip())
 
        for clause in clauses:
            clause = clause.strip()
            if not clause:
                continue
            
            # match point definitions such as
            # "a :", "a b c :", "a : coll a b c" or "a b c : xxx xxx xxx"
            match = re.match(r'^(\w+(?:\s+\w+)*)\s*:\s*(.*)$', clause)
            if not match:
                continue
            
            points_str = match.group(1)
            statements_str = match.group(2).strip()
            
            # extract all points, filter out helper points x00, x01, ...
            points = [
                p.strip().upper() 
                for p in points_str.split() 
                if p.strip() and not re.match(r'^x\d+$', p.strip(), re.IGNORECASE)
            ]
            
            if not points:
                continue

            # if there is no statement, it simply means "construct point(s)"
            if not statements_str or statements_str == ';':
                if len(points) == 1:
                    sentences.append(f"Construct point {points[0]}")
                else:
                    pts = ", ".join(points)
                    sentences.append(f"Construct points {pts}")
                continue
            
            # handle multiple statements, which may be comma-separated
            # or separated by ids in brackets
            comma_separated = [s.strip() for s in statements_str.split(',') if s.strip()]
            
            if len(comma_separated) == 1 and '[' in statements_str:
                # split by indexes like [000], [001], ...
                parts = re.split(r'(\[\d+\])', statements_str)
                statements: List[str] = []
                current_stmt = ""
                for part in parts:
                    current_stmt += part
                    if part.startswith('[') and part.endswith(']'):
                        if current_stmt.strip():
                            statements.append(current_stmt.strip())
                        current_stmt = ""
                if current_stmt.strip():
                    statements.append(current_stmt.strip())
            else:
                statements = comma_separated
            
            if not statements:
                if len(points) == 1:
                    sentences.append(f"Construct point {points[0]}")
                else:
                    pts = ", ".join(points)
                    sentences.append(f"Construct points {pts}")
                continue
            
            # translate each statement
            translated_statements: List[str] = []
            for stmt in statements:
                stmt_parts = stmt.strip().split()
                if not stmt_parts:
                    continue
                
                pred_name = stmt_parts[0]
                # filter out ids like [000] and helper points x00, x01, ...
                args = [
                    arg for arg in stmt_parts[1:] 
                    if not (arg.startswith('[') and arg.endswith(']'))
                    and not re.match(r'^x\d+$', arg.strip(), re.IGNORECASE)
                ]
                
                translation = self.translate_predicate(pred_name, args)
                if translation:
                    translated_statements.append(translation)
                else:
                    translated_statements.append(f"{pred_name}({', '.join(args)})")
            
            if translated_statements:
                cond = " and ".join(translated_statements)
                if len(points) == 1:
                    sentences.append(f"Construct point {points[0]} such that {cond}")
                else:
                    pts = ", ".join(points)
                    sentences.append(f"Construct points {pts} such that {cond}")
            else:
                if len(points) == 1:
                    sentences.append(f"Construct point {points[0]}")
                else:
                    pts = ", ".join(points)
                    sentences.append(f"Construct points {pts}")
        
        return ". ".join(sentences) + "."
    
    def translate_llm_input(self, llm_input: str) -> str:
        """
        Extract and translate the problem part from a full llm_input_renamed.
        
        Args:
            llm_input: full llm_input_renamed string containing a <problem> tag
        
        Returns:
            Natural language translation of the problem
        """
        # extract content inside <problem> tag
        match = re.search(r'<problem>(.*?)</problem>', llm_input, re.DOTALL)
        if not match:
            return ""
        
        problem_text = match.group(1).strip()
        clauses = [clause.strip() for clause in problem_text.split(';') if clause.strip()]
        translated_parts = []
        free_points = []
        
        for clause in clauses:
            if ':' not in clause:
                translated = self.translate_problem(clause)
                if translated:
                    translated_parts.append(translated)
                continue
            
            lhs, rhs = clause.split(':', 1)
            points = [p.strip() for p in lhs.split() if p.strip()]
            rhs = rhs.strip()
            if not rhs:
                free_points.extend(points)
                continue
            
            translated = self.translate_problem(clause)
            if translated:
                translated_parts.append(translated)
        
        if free_points:
            if len(free_points) == 1:
                free_desc = f"Construct point {free_points[0].upper()}"
            else:
                pts = ", ".join(p.upper() for p in free_points)
                free_desc = f"Construct points {pts}"
            translated_parts.insert(0, free_desc + ".")
        
        return ". ".join(translated_parts).strip(". ")
    
    def translate_llm_output(self, llm_output: str) -> Dict[str, str]:
        """
        Extract and translate all parts from a full llm_output_renamed.
        
        Args:
            llm_output: full llm_output_renamed string containing <aux>, <numerical_check>, <proof> tags
        
        Returns:
            Dictionary containing translated aux, numerical_check and proof
        """
        result = {}
        
        # extract aux part
        aux_match = re.search(r'<aux>(.*?)</aux>', llm_output, re.DOTALL)
        if aux_match:
            aux_text = aux_match.group(1).strip()
            # aux format is similar to problem_origin; reuse translate_problem_origin
            if aux_text:
                result['aux'] = self.translate_problem_origin(aux_text)
        
        # extract numerical_check part (often ignorable or simplified)
        num_check_match = re.search(r'<numerical_check>(.*?)</numerical_check>', llm_output, re.DOTALL)
        if num_check_match:
            num_check_text = num_check_match.group(1).strip()
            # parse predicates in numerical_check
            predicates = re.findall(r'(\w+)\s+([a-z0-9\s]+?)\s+\[(\d+)\]', num_check_text)
            if predicates:
                translations = []
                for pred_name, args_str, _ in predicates:
                    args = [a.strip() for a in args_str.split() if a.strip()]
                    trans = self.translate_predicate(pred_name, args)
                    if trans:
                        translations.append(trans)
                if translations:
                    result['numerical_check'] = "; ".join(translations) + "."
        
        # extract proof part
        proof_match = re.search(r'<proof>(.*?)</proof>', llm_output, re.DOTALL)
        if proof_match:
            proof_text = proof_match.group(1).strip()
            result['proof'] = self.translate_proof(proof_text, simplify=True)
        
        return result
    
    def _simplify_premises(self, premises: List[str]) -> List[str]:
        """
        Simplify a list of premise translations and remove redundancy.
        
        Args:
            premises: list of premise translations
        
        Returns:
            Simplified list of premises
        """
        if not premises:
            return premises
        
        # deduplicate
        seen = set()
        unique_premises = []
        for p in premises:
            if p not in seen:
                seen.add(p)
                unique_premises.append(p)
        
        # previously merged midpoint information in Chinese; now just return unique premises
        return unique_premises


def main():
    """Test function"""
    translator = SymbolTranslator()
    
    # test problem translation
    print("=" * 60)
    print("Problem translation test")
    print("=" * 60)
    test_problems = [
        "a : ; b : ; c : ; d : coll b c d [000] cong b d c d [001] ; e : coll a c e [002] cong a e c e [003] ? simtri a b c e d c",
        "a : ; b : ; c : coll a b c [000] cong a b b c [001] ? rconst a b a c 1/2",
    ]
    for i, test_case in enumerate(test_problems, 1):
        print(f"\nTest case {i}:")
        print(f"Input: {test_case}")
        result = translator.translate_problem(test_case)
        print(f"Output: {result}")
    
    # test proof translation
    print("\n" + "=" * 60)
    print("Proof translation test")
    print("=" * 60)
    test_proof = "para a f b f [009] r82 [004] ; eqangle a b b c b f b d [010] AR [004] [000] [009] ; midp a b f [011] r54 [004] [005] ;"
    print(f"Input: {test_proof}")
    result = translator.translate_proof(test_proof)
    print(f"Output: {result}")
    
    # test constructions translation
    print("\n" + "=" * 60)
    print("Constructions translation test")
    print("=" * 60)
    test_constructions = "a b c : r_triangle a b c; d : free d; e : on_line e a b; g : excenter g a d e;"
    print(f"Input: {test_constructions}")
    result = translator.translate_constructions(test_constructions)
    print(f"Output: {result}")


if __name__ == "__main__":
    main()
