import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline
from sklearn.compose import TransformedTargetRegressor
from sklearn.ensemble import RandomForestRegressor, GradientBoostingRegressor
from sklearn.linear_model import Ridge, Lasso
import matplotlib.pyplot as plt
from sklearn.tree import plot_tree
import seaborn as sns
from scipy.optimize import minimize

def load_data(file_path):
    # 更新列名以包含PPL
    df = pd.read_csv(file_path, sep=r'\s+', engine='python', encoding='utf-16')
    df.columns = ['INDEX', 'CODE', 'MATH', 'GENERAL', '平均RL-LOSS', '最大RL-LOSS', 'PPL']
    
    # 验证比例总和
    df['比例总和'] = df['CODE'] + df['MATH'] + df['GENERAL']
    df = df[np.isclose(df['比例总和'], 1.0, atol=0.01)].copy()
    
    return df[['CODE', 'MATH', 'GENERAL', '平均RL-LOSS', '最大RL-LOSS', 'PPL']]

def train_model(X, y):
    pipeline = Pipeline([
        ('scaler', StandardScaler()),
        ('regressor', GradientBoostingRegressor(
            n_estimators=200,
            max_depth=4,
            learning_rate=0.05,
            random_state=42
        ))
    ])
    model = TransformedTargetRegressor(regressor=pipeline, func=np.log1p, inverse_func=np.expm1)
    model.fit(X, y)

    # 提取GBDT模型
    if isinstance(model, TransformedTargetRegressor):
        if isinstance(model.regressor_, Pipeline):
            gbdt = model.regressor_.named_steps['regressor']
        else:
            gbdt = model.regressor_
    else:
        gbdt = model

    # 特征重要性分析
    print("\n🔎   特征重要性 (feature_importances_):")
    importances = gbdt.feature_importances_
    sorted_idx = importances.argsort()[::-1]
    top_n = 10
    for i in sorted_idx[:top_n]:
        print(f"  {X.columns[i]}: {importances[i]:.6f}")

    # 树的数量信息
    print(f"\n🌳   模型共训练了 {len(gbdt.estimators_)} 棵树")

    # 预测示例
    print("\n📦   前几棵树在前几个样本上的预测值（示例）:")
    for tree_id in range(min(3, len(gbdt.estimators_))):
        tree = gbdt.estimators_[tree_id][0]
        preds = tree.predict(X[:3])
        print(f"  第 {tree_id+1} 棵树预测值: {preds}")

    print("\n🧮 模型最终预测值（前几个样本）:")
    final_preds = model.predict(X[:3])
    print(final_preds)

    return model

def train_model_ridge(X, y):
    pipeline = Pipeline([
        ('scaler', StandardScaler()),
        ('regressor', Ridge(alpha=0.5))
    ])
    model = TransformedTargetRegressor(
        regressor=pipeline,
        func=np.log1p,
        inverse_func=np.expm1
    )
    model.fit(X, y)
    if isinstance(model, TransformedTargetRegressor):
        pipeline = model.regressor_
    else:
        pipeline = model  # 直接是 pipeline

    # 从 pipeline 中取出 Ridge 模型
    ridge = pipeline.named_steps['regressor']

    # 打印参数值
    print("🧮 岭回归模型参数值：")
    for feature, coef in zip(X.columns, ridge.coef_):
        print(f"  β({feature}): {coef:.6f}")

    print(f"  截距项 β₀ (intercept): {ridge.intercept_:.6f}")
    return model

def train_model_rf(X, y):
    model = RandomForestRegressor(
        n_estimators=150,
        max_depth=5,
        min_samples_split=5,
        random_state=42
    )
    model = TransformedTargetRegressor(
        regressor=model,
        func=np.log1p,
        inverse_func=np.expm1
    )
    model.fit(X, y)
    top_n = 10
    # 取出随机森林核心模型
    if isinstance(model, TransformedTargetRegressor):
        rf = model.regressor_
        # 可能还包了 Pipeline，按需处理（这里直接假设没包 Pipeline）
        if hasattr(rf, 'named_steps'):
            rf = rf.named_steps['regressor']
    else:
        rf = model

    print("\n🌲  随机森林模型训练后参数值：")

    # 特征重要性
    importances = rf.feature_importances_
    sorted_idx = importances.argsort()[::-1]
    print("\n🔎  特征重要性 (feature_importances_):")
    for i in sorted_idx[:top_n]:
        print(f"  {X.columns[i]}: {importances[i]:.6f}")

    # 估计器数量
    print(f"\n🌳  模型共训练了 {len(rf.estimators_)} 棵树")

    # 展示前3棵树在前3个样本上的预测（示例）
    print("\n📦  前几棵树在前几个样本上的预测值（示例）:")
    for tree_id in range(min(3, len(rf.estimators_))):
        tree = rf.estimators_[tree_id]
        preds = tree.predict(X[:3])
        print(f"  第 {tree_id+1} 棵树预测值: {preds}")

    # 总体预测值（前3个样本）
    print("\n🧮 模型最终预测值（前几个样本）:")
    final_preds = model.predict(X[:3])
    print(final_preds)
    return model


def train_model_lasso(X, y):
    pipeline = Pipeline([
        ('scaler', StandardScaler()),
        ('regressor', Lasso(alpha=0.01))
    ])
    model = TransformedTargetRegressor(
        regressor=pipeline,
        func=np.log1p,
        inverse_func=np.expm1
    )
    model.fit(X, y)
    # 取出核心模型
    if isinstance(model, TransformedTargetRegressor):
        inner = model.regressor_
        if isinstance(inner, Pipeline):
            lasso = inner.named_steps['regressor']
        else:
            lasso = inner
    else:
        lasso = model

    print("\n🖊️  Lasso 回归训练后回归系数 (coef_):")
    coefs = lasso.coef_
    for i, col in enumerate(X.columns):
        print(f"  {col}: {coefs[i]:.6f}")

    if hasattr(lasso, 'intercept_'):
        print(f"\n截距 intercept_: {lasso.intercept_:.6f}")
    return model

def optimize_with_grid_and_refine(model, coarse_step=0.005):
    """
    粗网格搜索 + 局部优化精修，寻找目标最小化组合
    """
    # 粗网格搜索
    grid = np.arange(0.0001, 1.0, coarse_step)  # 上限改为1.0以避免边界问题
    best_cfg = None
    best_loss = float('inf')

    for code in grid:
        for math in grid:
            general = 1.0 - code - math
            if general >= 0:  # 允许等于0
                X_input = pd.DataFrame([[code, math, general]], columns=['CODE', 'MATH', 'GENERAL'])
                pred = model.predict(X_input)[0]
                if pred < best_loss:
                    best_loss = pred
                    best_cfg = (code, math, general)

    print(f"🟡 粗网格搜索初始最优点: CODE={best_cfg[0]:.3f}, MATH={best_cfg[1]:.3f}, GENERAL={best_cfg[2]:.3f}, 目标值={best_loss:.6f}")

    # 局部优化精修
    def loss_fn(x):
        code, math = x
        general = 1.0 - code - math
        if general < 0:  # 只检查负值
            return 1e9  # 更大的惩罚值
        X = pd.DataFrame([[code, math, general]], columns=['CODE', 'MATH', 'GENERAL'])
        return model.predict(X)[0]

    x0 = [best_cfg[0], best_cfg[1]]
    bounds = [(0.001, 0.999), (0.001, 0.999)]  # 避免0和1的边界值
    
    # 添加容差的约束条件
    constraints = (
        {'type': 'ineq', 'fun': lambda x: 1.0 - x[0] - x[1] - 1e-5},  # general >= 0
        {'type': 'ineq', 'fun': lambda x: x[0] + x[1] - 1e-5}        # general <= 1
    )

    result = minimize(loss_fn, x0, method='SLSQP', bounds=bounds, constraints=constraints)

    if result.success:
        code, math = result.x
        general = 1.0 - code - math
        min_loss = result.fun
        print(f"✅  优化成功: CODE={code:.3f}, MATH={math:.3f}, GENERAL={general:.3f}, 目标值={min_loss:.6f}")
        return (code, math, general), min_loss
    else:
        print(f"⚠️  优化失败: {result.message}")
        print(f"⚠️  使用粗网格搜索结果: CODE={best_cfg[0]:.3f}, MATH={best_cfg[1]:.3f}, GENERAL={best_cfg[2]:.3f}")
        return best_cfg, best_loss


def main():
    file_path = '1M_data_config.txt'
    df = load_data(file_path)
    X = df[['CODE', 'MATH', 'GENERAL']]

    # 用于存储所有目标的结果
    summary = {}

    # 为每个目标分别建模和优化
    for target in ['平均RL-LOSS', '最大RL-LOSS', 'PPL']:
        y = df[target]
        print(f"\n{'='*50}")
        print(f"📌  正在拟合模型预测 {target} ...")
        print(f"{'='*50}")
        
        model = train_model(X, y)
       # model = train_model_ridge(X, y)
       # model = train_model_rf(X, y)
       # model = train_model_lasso(X, y)

        best_cfg, best_loss = optimize_with_grid_and_refine(model)

        summary[target] = {
            'CODE': best_cfg[0],
            'MATH': best_cfg[1],
            'GENERAL': best_cfg[2],
            'LOSS': best_loss
        }

        print(f"\n🔍  [{target}] 最优配比结果:")
        print(f"  CODE    = {best_cfg[0]:.4f}")
        print(f"  MATH    = {best_cfg[1]:.4f}")
        print(f"  GENERAL = {best_cfg[2]:.4f}")
        print(f"  预测{target} = {best_loss:.6f}")

    # 打印对比结果表格
    print("\n📊  最优配比结果对比:")
    print("目标           CODE     MATH     GENERAL   最小值")
    for target in ['平均RL-LOSS', '最大RL-LOSS', 'PPL']:
        res = summary[target]
        print(f"{target:<13} {res['CODE']:.4f}   {res['MATH']:.4f}   {res['GENERAL']:.4f}   {res['LOSS']:.6f}")

if __name__ == "__main__":
    main()
