# 只更新候选变量的特征

import random
import numpy as np
import torch
import argparse
import scipy.sparse as sp
import dgl
import pickle, gzip
import sys
import itertools
from pyscipopt import SCIP_PARAMSETTING, Model, Branchrule, Nodesel, SCIP_RESULT
from torch.utils.data import Dataset
from treelib import Tree
sys.path.append('../')
from src.logger import Logger
from src.model import GCNN_Net, PD_Net
import time
import torch.nn.functional as F
logger = Logger.logger
import time



def extract_state_new_37_col(model, buffer=None):
    """Build the variable (column) feature matrix for the candidate state.

    The raw solver state comes from ``model.getGcnnCandsStateCol()``. Only
    column features are assembled; no row or edge features are produced.

    Parameters
    ----------
    model : object
        Solver model exposing ``getGcnnCandsStateCol()``, which returns
        ``(s, cands, cands_pos)``. ``s['col']`` must provide the arrays
        ``types``, ``coefs``, ``lbs``, ``ubs``, ``sol_is_at_lb``,
        ``sol_is_at_ub``, ``solfracs``, ``basestats``, ``redcosts``,
        ``ages`` and ``solvals``; ``s['stats']['nlps']`` is read as well.
    buffer : dict, optional
        Accepted for signature compatibility with the other extractors but
        never read or modified: the state is rebuilt from scratch on every
        call (the previous implementation overwrote it with an empty dict
        before use, so its cache branches could never run).

    Returns
    -------
    state_cands_col : dict
        ``{'variable_features': {'names': list of str, 'values': ndarray}}``
        with one row per column and one named column per feature.
    cands, cands_pos
        Passed through unchanged from ``model.getGcnnCandsStateCol()``.
    """

    def _feature_names(feats):
        # One name per matrix column: multi-column features get an index suffix.
        names = []
        for key, arr in feats.items():
            width = arr.shape[1]
            if width == 1:
                names.append(key)
            else:
                names.extend(f'{key}_{i}' for i in range(width))
        return names

    s, cands, cands_pos = model.getGcnnCandsStateCol()
    cols = s['col']

    # Scale for objective coefficients and reduced costs; fall back to 1 so
    # an all-zero objective does not cause a division by zero.
    obj_norm = np.linalg.norm(cols['coefs'])
    obj_norm = 1 if obj_norm <= 0 else obj_norm

    n_cols = len(cols['types'])
    col_idx = np.arange(n_cols)

    # NOTE: insertion order below defines the column order of 'values'.
    col_feats = {}
    col_feats['type'] = np.zeros((n_cols, 4))  # BINARY INTEGER IMPLINT CONTINUOUS
    col_feats['type'][col_idx, cols['types']] = 1
    col_feats['coef_normalized'] = cols['coefs'].reshape(-1, 1) / obj_norm

    # A NaN bound is treated as "no bound".
    col_feats['has_lb'] = ~np.isnan(cols['lbs']).reshape(-1, 1)
    col_feats['has_ub'] = ~np.isnan(cols['ubs']).reshape(-1, 1)

    col_feats['sol_is_at_lb'] = cols['sol_is_at_lb'].reshape(-1, 1)
    col_feats['sol_is_at_ub'] = cols['sol_is_at_ub'].reshape(-1, 1)
    # reshape may return a view, in which case the zeroing below also
    # updates s['col']['solfracs'] (same as the previous implementation).
    col_feats['sol_frac'] = cols['solfracs'].reshape(-1, 1)
    col_feats['sol_frac'][cols['types'] == 3] = 0  # continuous have no fractionality
    col_feats['basis_status'] = np.zeros((n_cols, 4))  # LOWER BASIC UPPER ZERO
    col_feats['basis_status'][col_idx, cols['basestats']] = 1
    col_feats['reduced_cost'] = cols['redcosts'].reshape(-1, 1) / obj_norm
    col_feats['age'] = cols['ages'].reshape(-1, 1) / (s['stats']['nlps'] + 5)
    col_feats['sol_val'] = cols['solvals'].reshape(-1, 1)

    variable_features = {
        'names': _feature_names(col_feats),
        'values': np.concatenate(list(col_feats.values()), axis=-1),
    }

    state_cands_col = {
        'variable_features': variable_features
    }

    return state_cands_col, cands, cands_pos


def extract_state_new_37_all(model, buffer=None):
    """Build constraint, edge and variable features for the candidate state.

    The raw solver state comes from ``model.getGcnnCandsState()``. Every row
    with a finite left-hand side and every row with a finite right-hand side
    becomes one constraint node (lhs rows first, negated), so a ranged row
    yields two nodes.

    Parameters
    ----------
    model : object
        Solver model exposing ``getGcnnCandsState()``, which returns
        ``(s, cands, cands_pos)`` where ``s`` holds the ``'col'``, ``'row'``,
        ``'nzrcoef'`` and ``'stats'`` entries read below.
    buffer : dict, optional
        Accepted for signature compatibility with the other extractors but
        never read or modified: the state is rebuilt from scratch on every
        call (the previous implementation overwrote it with an empty dict
        before use, so its cache branches could never run).

    Returns
    -------
    state_cands_all : dict
        ``{'constraint_features': {'names', 'values'},
        'edge_features': {'names', 'indices', 'values'},
        'variable_features': {'names', 'values'}}``. Edge ``indices`` is a
        ``2 x n_edges`` array of (constraint node, column) pairs.
    cands, cands_pos
        Passed through unchanged from ``model.getGcnnCandsState()``.

    Notes
    -----
    ``s['row']['norms']`` is modified in place (zeros become 1), and
    ``s['col']['solfracs']`` may be zeroed for continuous columns when
    ``reshape`` returns a view.
    """

    def _feature_names(feats):
        # One name per matrix column: multi-column features get an index suffix.
        names = []
        for key, arr in feats.items():
            width = arr.shape[1]
            if width == 1:
                names.append(key)
            else:
                names.extend(f'{key}_{i}' for i in range(width))
        return names

    s, cands, cands_pos = model.getGcnnCandsState()
    cols, rows, nz = s['col'], s['row'], s['nzrcoef']

    # Scale for objective coefficients, reduced costs and dual values; fall
    # back to 1 so an all-zero objective does not cause a division by zero.
    obj_norm = np.linalg.norm(cols['coefs'])
    obj_norm = 1 if obj_norm <= 0 else obj_norm

    # Zero row norms are replaced by 1 (in place) to keep divisions safe.
    row_norms = rows['norms']
    row_norms[row_norms == 0] = 1

    age_scale = s['stats']['nlps'] + 5

    # ---- Column features -> variable features ----
    # NOTE: insertion order defines the column order of 'values'.
    n_cols = len(cols['types'])
    col_idx = np.arange(n_cols)

    col_feats = {}
    col_feats['type'] = np.zeros((n_cols, 4))  # BINARY INTEGER IMPLINT CONTINUOUS
    col_feats['type'][col_idx, cols['types']] = 1
    col_feats['coef_normalized'] = cols['coefs'].reshape(-1, 1) / obj_norm

    # A NaN bound is treated as "no bound".
    col_feats['has_lb'] = ~np.isnan(cols['lbs']).reshape(-1, 1)
    col_feats['has_ub'] = ~np.isnan(cols['ubs']).reshape(-1, 1)

    col_feats['sol_is_at_lb'] = cols['sol_is_at_lb'].reshape(-1, 1)
    col_feats['sol_is_at_ub'] = cols['sol_is_at_ub'].reshape(-1, 1)
    col_feats['sol_frac'] = cols['solfracs'].reshape(-1, 1)
    col_feats['sol_frac'][cols['types'] == 3] = 0  # continuous have no fractionality
    col_feats['basis_status'] = np.zeros((n_cols, 4))  # LOWER BASIC UPPER ZERO
    col_feats['basis_status'][col_idx, cols['basestats']] = 1
    col_feats['reduced_cost'] = cols['redcosts'].reshape(-1, 1) / obj_norm
    col_feats['age'] = cols['ages'].reshape(-1, 1) / age_scale
    col_feats['sol_val'] = cols['solvals'].reshape(-1, 1)

    variable_features = {
        'names': _feature_names(col_feats),
        'values': np.concatenate(list(col_feats.values()), axis=-1),
    }

    # ---- Row features -> constraint features ----
    # Rows whose lhs / rhs is not NaN; lhs entries are negated so that both
    # halves are expressed in the same ("<=") orientation.
    has_lhs = np.nonzero(~np.isnan(rows['lhss']))[0]
    has_rhs = np.nonzero(~np.isnan(rows['rhss']))[0]

    row_feats = {}
    row_feats['obj_cosine_similarity'] = np.concatenate((
        -rows['objcossims'][has_lhs],
        +rows['objcossims'][has_rhs])).reshape(-1, 1)

    row_feats['bias'] = np.concatenate((
        -(rows['lhss'] / row_norms)[has_lhs],
        +(rows['rhss'] / row_norms)[has_rhs])).reshape(-1, 1)

    row_feats['is_tight'] = np.concatenate((
        rows['is_at_lhs'][has_lhs],
        rows['is_at_rhs'][has_rhs])).reshape(-1, 1)

    row_feats['age'] = np.concatenate((
        rows['ages'][has_lhs],
        rows['ages'][has_rhs])).reshape(-1, 1) / age_scale

    # todo: check whether this change helps
    duals = rows['dualsols'] / (row_norms * obj_norm)
    row_feats['dualsol_val_normalized'] = np.concatenate((
        -duals[has_lhs],
        +duals[has_rhs])).reshape(-1, 1)

    constraint_features = {
        'names': _feature_names(row_feats),
        'values': np.concatenate(list(row_feats.values()), axis=-1),
    }

    # ---- Edge features ----
    # Coefficients divided by their row norm, stacked in the same
    # (lhs rows negated, then rhs rows) order as the constraint nodes.
    coef_matrix = sp.csr_matrix(
        (nz['vals'] / row_norms[nz['rowidxs']],
         (nz['rowidxs'], nz['colidxs'])),
        shape=(len(rows['lhss']), len(cols['types'])))

    coef_matrix = sp.vstack((
        -coef_matrix[has_lhs, :],
        coef_matrix[has_rhs, :])).tocoo(copy=False)

    edge_feats = {'coef_normalized': coef_matrix.data.reshape(-1, 1)}

    edge_features = {
        'names': _feature_names(edge_feats),
        'indices': np.vstack([coef_matrix.row, coef_matrix.col]),
        'values': np.concatenate(list(edge_feats.values()), axis=-1),
    }

    state_cands_all = {
        'constraint_features': constraint_features,
        'edge_features': edge_features,
        'variable_features': variable_features
    }

    return state_cands_all, cands, cands_pos


def extract_state_new_37_base(model, buffer=None):
    """Build the bipartite-graph features of the current solver state.

    The raw state comes from ``model.getState(prev)``, where ``prev`` is the
    raw state stored in ``buffer`` by an earlier call (or ``None``).

    Parameters
    ----------
    model : object
        Solver model exposing ``getNNodes()`` and ``getState(prev_state)``.
    buffer : dict, optional
        Cache shared between calls. When it already holds a ``'state'``
        entry, the objective norm, the ``type`` / ``coef_normalized`` column
        features, the ``obj_cosine_similarity`` / ``bias`` row features, the
        lhs/rhs row index sets and all edge data are reused from it; the
        other features are recomputed. When ``buffer`` is ``None`` or
        ``model.getNNodes() == 1`` a fresh local dict is used instead and the
        caller's dict is left untouched.

    Returns
    -------
    state_base : dict
        ``{'constraint_features', 'edge_features', 'variable_features'}``.
    edge_features : dict
        ``{'names', 'indices', 'values'}`` (same object as in ``state_base``).
    variable_features : dict
        ``{'names', 'values'}`` (same object as in ``state_base``).

    Notes
    -----
    ``s['row']['norms']`` is modified in place (zeros become 1).
    """

    def _feature_names(feats):
        # One name per matrix column: multi-column features get an index suffix.
        names = []
        for key, arr in feats.items():
            width = arr.shape[1]
            if width == 1:
                names.append(key)
            else:
                names.extend(f'{key}_{i}' for i in range(width))
        return names

    if buffer is None or model.getNNodes() == 1:
        buffer = {}

    # Hand the previously extracted raw state (if any) back to the solver.
    s = model.getState(buffer.get('scip_state'))
    buffer['scip_state'] = s

    cols, rows = s['col'], s['row']
    age_scale = s['stats']['nlps'] + 5
    n_cols = len(cols['types'])
    col_idx = np.arange(n_cols)

    # Zero row norms are replaced by 1 (in place) to keep divisions safe.
    row_norms = rows['norms']
    row_norms[row_norms == 0] = 1

    reuse = 'state' in buffer
    if reuse:
        # Static parts were computed by an earlier call.
        cache = buffer['state']
        obj_norm = cache['obj_norm']
        col_feats = cache['col_feats']
        row_feats = cache['row_feats']
        has_lhs = cache['has_lhs']
        has_rhs = cache['has_rhs']
        edge_row_idxs = cache['edge_row_idxs']
        edge_col_idxs = cache['edge_col_idxs']
        edge_feats = cache['edge_feats']
    else:
        obj_norm = np.linalg.norm(cols['coefs'])
        if obj_norm <= 0:
            obj_norm = 1

        # Static column features. BINARY INTEGER IMPLINT CONTINUOUS
        type_one_hot = np.zeros((n_cols, 4))
        type_one_hot[col_idx, cols['types']] = 1
        col_feats = {
            'type': type_one_hot,
            'coef_normalized': cols['coefs'].reshape(-1, 1) / obj_norm,
        }

        # Static row features: lhs rows (negated) first, then rhs rows.
        has_lhs = np.nonzero(~np.isnan(rows['lhss']))[0]
        has_rhs = np.nonzero(~np.isnan(rows['rhss']))[0]
        row_feats = {
            'obj_cosine_similarity': np.concatenate((
                -rows['objcossims'][has_lhs],
                +rows['objcossims'][has_rhs])).reshape(-1, 1),
            'bias': np.concatenate((
                -(rows['lhss'] / row_norms)[has_lhs],
                +(rows['rhss'] / row_norms)[has_rhs])).reshape(-1, 1),
        }

        # Edges: coefficient / row norm, stacked like the constraint nodes.
        nz = s['nzrcoef']
        scaled = sp.csr_matrix(
            (nz['vals'] / row_norms[nz['rowidxs']],
             (nz['rowidxs'], nz['colidxs'])),
            shape=(len(rows['nnzrs']), len(cols['types'])))
        stacked = sp.vstack((
            -scaled[has_lhs, :],
            scaled[has_rhs, :])).tocoo(copy=False)
        edge_row_idxs, edge_col_idxs = stacked.row, stacked.col
        edge_feats = {'coef_normalized': stacked.data.reshape(-1, 1)}

    # Dynamic column features (refreshed on every call; key order matters).
    sol_frac = cols['solfracs'].reshape(-1, 1)
    sol_frac[cols['types'] == 3] = 0  # continuous have no fractionality
    basis_one_hot = np.zeros((n_cols, 4))  # LOWER BASIC UPPER ZERO
    basis_one_hot[col_idx, cols['basestats']] = 1
    col_feats.update({
        'has_lb': ~np.isnan(cols['lbs']).reshape(-1, 1),
        'has_ub': ~np.isnan(cols['ubs']).reshape(-1, 1),
        'sol_is_at_lb': cols['sol_is_at_lb'].reshape(-1, 1),
        'sol_is_at_ub': cols['sol_is_at_ub'].reshape(-1, 1),
        'sol_frac': sol_frac,
        'basis_status': basis_one_hot,
        'reduced_cost': cols['redcosts'].reshape(-1, 1) / obj_norm,
        'age': cols['ages'].reshape(-1, 1) / age_scale,
        'sol_val': cols['solvals'].reshape(-1, 1),
    })

    # Dynamic row features.
    # todo: check whether this change helps
    duals = rows['dualsols'] / (row_norms * obj_norm)
    row_feats.update({
        'is_tight': np.concatenate((
            rows['is_at_lhs'][has_lhs],
            rows['is_at_rhs'][has_rhs])).reshape(-1, 1),
        'age': np.concatenate((
            rows['ages'][has_lhs],
            rows['ages'][has_rhs])).reshape(-1, 1) / age_scale,
        'dualsol_val_normalized': np.concatenate((
            -duals[has_lhs],
            +duals[has_rhs])).reshape(-1, 1),
    })

    variable_features = {
        'names': _feature_names(col_feats),
        'values': np.concatenate(list(col_feats.values()), axis=-1),
    }
    constraint_features = {
        'names': _feature_names(row_feats),
        'values': np.concatenate(list(row_feats.values()), axis=-1),
    }
    edge_features = {
        'names': _feature_names(edge_feats),
        'indices': np.vstack([edge_row_idxs, edge_col_idxs]),
        'values': np.concatenate(list(edge_feats.values()), axis=-1),
    }

    if not reuse:
        buffer['state'] = {
            'obj_norm': obj_norm,
            'col_feats': col_feats,
            'row_feats': row_feats,
            'has_lhs': has_lhs,
            'has_rhs': has_rhs,
            'edge_row_idxs': edge_row_idxs,
            'edge_col_idxs': edge_col_idxs,
            'edge_feats': edge_feats,
        }

    state_base = {
        'constraint_features': constraint_features,
        'edge_features': edge_features,
        'variable_features': variable_features
    }

    return state_base, edge_features, variable_features


def extract_state_new_37_time(model, buffer=None):
    """Timed variant of the bipartite-graph feature extraction with candidates.

    The raw state comes from
    ``model.getState_new_37_cands_time_test(prev)``. Two timings are printed
    to stdout: the duration of that solver call and the duration of the
    feature assembly that follows it.

    Parameters
    ----------
    model : object
        Solver model exposing ``getNNodes()`` and
        ``getState_new_37_cands_time_test(prev_state)``, the latter returning
        ``(s, cands, cands_pos)``.
    buffer : dict, optional
        Cache shared between calls. When it already holds a ``'state'``
        entry, the objective norm, the ``type`` / ``coef_normalized`` column
        features, the ``obj_cosine_similarity`` / ``bias`` row features, the
        lhs/rhs row index sets and all edge data are reused from it. When
        ``buffer`` is ``None`` or ``model.getNNodes() == 1`` a fresh local
        dict is used instead and the caller's dict is left untouched.

    Returns
    -------
    constraint_features : dict
        ``{'names', 'values'}``.
    edge_features : dict
        ``{'names', 'indices', 'values'}``.
    variable_features : dict
        ``{'names', 'values'}``; includes ``inc_val`` and ``avg_inc_val``.
    cands, cands_pos
        Passed through unchanged from the solver call.

    Notes
    -----
    ``s['row']['norms']`` is modified in place (zeros become 1).
    """

    def _feature_names(feats):
        # One name per matrix column: multi-column features get an index suffix.
        names = []
        for key, arr in feats.items():
            width = arr.shape[1]
            if width == 1:
                names.append(key)
            else:
                names.extend(f'{key}_{i}' for i in range(width))
        return names

    if buffer is None or model.getNNodes() == 1:
        buffer = {}

    # Time the raw state extraction performed by the solver.
    t_fetch = time.time()
    s, cands, cands_pos = model.getState_new_37_cands_time_test(buffer.get('scip_state'))
    print(f"@@@@@@@@@@@@@@@@ now getState_new_37_cands_time_test:\t{time.time()-t_fetch}")

    # Time the Python-side feature assembly.
    t_build = time.time()

    buffer['scip_state'] = s

    cols, rows = s['col'], s['row']
    age_scale = s['stats']['nlps'] + 5
    n_cols = len(cols['types'])
    col_idx = np.arange(n_cols)

    # Zero row norms are replaced by 1 (in place) to keep divisions safe.
    row_norms = rows['norms']
    row_norms[row_norms == 0] = 1

    reuse = 'state' in buffer
    if reuse:
        # Static parts were computed by an earlier call.
        cache = buffer['state']
        obj_norm = cache['obj_norm']
        col_feats = cache['col_feats']
        row_feats = cache['row_feats']
        has_lhs = cache['has_lhs']
        has_rhs = cache['has_rhs']
        edge_row_idxs = cache['edge_row_idxs']
        edge_col_idxs = cache['edge_col_idxs']
        edge_feats = cache['edge_feats']
    else:
        obj_norm = np.linalg.norm(cols['coefs'])
        if obj_norm <= 0:
            obj_norm = 1

        # Static column features. BINARY INTEGER IMPLINT CONTINUOUS
        type_one_hot = np.zeros((n_cols, 4))
        type_one_hot[col_idx, cols['types']] = 1
        col_feats = {
            'type': type_one_hot,
            'coef_normalized': cols['coefs'].reshape(-1, 1) / obj_norm,
        }

        # Static row features: lhs rows (negated) first, then rhs rows.
        has_lhs = np.nonzero(~np.isnan(rows['lhss']))[0]
        has_rhs = np.nonzero(~np.isnan(rows['rhss']))[0]
        row_feats = {
            'obj_cosine_similarity': np.concatenate((
                -rows['objcossims'][has_lhs],
                +rows['objcossims'][has_rhs])).reshape(-1, 1),
            'bias': np.concatenate((
                -(rows['lhss'] / row_norms)[has_lhs],
                +(rows['rhss'] / row_norms)[has_rhs])).reshape(-1, 1),
        }

        # Edges: coefficient / row norm, stacked like the constraint nodes.
        nz = s['nzrcoef']
        scaled = sp.csr_matrix(
            (nz['vals'] / row_norms[nz['rowidxs']],
             (nz['rowidxs'], nz['colidxs'])),
            shape=(len(rows['nnzrs']), len(cols['types'])))
        stacked = sp.vstack((
            -scaled[has_lhs, :],
            scaled[has_rhs, :])).tocoo(copy=False)
        edge_row_idxs, edge_col_idxs = stacked.row, stacked.col
        edge_feats = {'coef_normalized': stacked.data.reshape(-1, 1)}

    # Dynamic column features (refreshed on every call; key order matters).
    sol_frac = cols['solfracs'].reshape(-1, 1)
    sol_frac[cols['types'] == 3] = 0  # continuous have no fractionality
    basis_one_hot = np.zeros((n_cols, 4))  # LOWER BASIC UPPER ZERO
    basis_one_hot[col_idx, cols['basestats']] = 1
    col_feats.update({
        'has_lb': ~np.isnan(cols['lbs']).reshape(-1, 1),
        'has_ub': ~np.isnan(cols['ubs']).reshape(-1, 1),
        'sol_is_at_lb': cols['sol_is_at_lb'].reshape(-1, 1),
        'sol_is_at_ub': cols['sol_is_at_ub'].reshape(-1, 1),
        'sol_frac': sol_frac,
        'basis_status': basis_one_hot,
        'reduced_cost': cols['redcosts'].reshape(-1, 1) / obj_norm,
        'age': cols['ages'].reshape(-1, 1) / age_scale,
        'sol_val': cols['solvals'].reshape(-1, 1),
        'inc_val': cols['incvals'].reshape(-1, 1),
        'avg_inc_val': cols['avgincvals'].reshape(-1, 1),
    })

    # Dynamic row features.
    # todo: check whether this change helps
    duals = rows['dualsols'] / (row_norms * obj_norm)
    row_feats.update({
        'is_tight': np.concatenate((
            rows['is_at_lhs'][has_lhs],
            rows['is_at_rhs'][has_rhs])).reshape(-1, 1),
        'age': np.concatenate((
            rows['ages'][has_lhs],
            rows['ages'][has_rhs])).reshape(-1, 1) / age_scale,
        'dualsol_val_normalized': np.concatenate((
            -duals[has_lhs],
            +duals[has_rhs])).reshape(-1, 1),
    })

    variable_features = {
        'names': _feature_names(col_feats),
        'values': np.concatenate(list(col_feats.values()), axis=-1),
    }
    constraint_features = {
        'names': _feature_names(row_feats),
        'values': np.concatenate(list(row_feats.values()), axis=-1),
    }
    edge_features = {
        'names': _feature_names(edge_feats),
        'indices': np.vstack([edge_row_idxs, edge_col_idxs]),
        'values': np.concatenate(list(edge_feats.values()), axis=-1),
    }

    if not reuse:
        buffer['state'] = {
            'obj_norm': obj_norm,
            'col_feats': col_feats,
            'row_feats': row_feats,
            'has_lhs': has_lhs,
            'has_rhs': has_rhs,
            'edge_row_idxs': edge_row_idxs,
            'edge_col_idxs': edge_col_idxs,
            'edge_feats': edge_feats,
        }

    print(f"@@@@@@@@@@@@@@@@ 37 getState fun time:{time.time()-t_build}")

    return constraint_features, edge_features, variable_features, cands, cands_pos


# 将scip模型当前的特征转换成GCNN模型二部图表示，其中变量和约束是两端的节点。
def extract_state_baseline_time(model, buffer=None):
    """
    计算求解器的二部图表示。在这种表示中，MILP的变量和约束是左右两边的节点，
    如果变量涉及约束，则一条边连接两个节点。节点和边都带有特征。
    Compute a bipartite graph representation of the solver. In this
    representation, the variables and constraints of the MILP are the
    left- and right-hand side nodes, and an edge links two nodes iff the
    variable is involved in the constraint. Both the nodes and edges carry
    features.
    
    Parameters
    ----------
    model : pyscipopt.scip.Model
        The current model.
        当前的scip模型
    buffer : dict
        A buffer to avoid re-extracting redundant information from the solver
        each time.
        缓冲区，以避免每次从解算器中重新提取冗余信息。
    Returns
    -------
    variable_features : dictionary of type {'names': list, 'values': np.ndarray}
        The features associated with the variable nodes in the bipartite graph.
        二部图中与变量节点相关的特征。
        这是一个稀疏矩阵在COO格式给出。
    edge_features : dictionary of type ('names': list, 'indices': np.ndarray, 'values': np.ndarray}
        The features associated with the edges in the bipartite graph.
        This is given as a sparse matrix in COO format.
        二部图中与边有关的特征。这是一个在COO格式的稀疏矩阵。
    constraint_features : dictionary of type {'names': list, 'values': np.ndarray}
        The features associated with the constraint nodes in the bipartite graph.
        二部图中与约束节点相关的特征。
    """
    if buffer is None or model.getNNodes() == 1:
        buffer = {}

    # 从缓冲区中更新状态
    # update state from buffer if any

    time_1 = time.time()
    s = model.getState_time_test(buffer['scip_state'] if 'scip_state' in buffer else None)
    print(f"@@@@@@@@@@@@@@@@ now baseline getstate:{time.time()-time_1}")

    time_start_get_start = time.time()

    buffer['scip_state'] = s

    if 'state' in buffer:
        obj_norm = buffer['state']['obj_norm']
    else:
        obj_norm = np.linalg.norm(s['col']['coefs'])
        obj_norm = 1 if obj_norm <= 0 else obj_norm

    row_norms = s['row']['norms']
    row_norms[row_norms == 0] = 1

    # 列的功能 -> 变量特征
    # Column features
    n_cols = len(s['col']['types'])

    if 'state' in buffer:
        col_feats = buffer['state']['col_feats']
    else:
        col_feats = {}
        col_feats['type'] = np.zeros((n_cols, 4))  # BINARY INTEGER IMPLINT CONTINUOUS
        col_feats['type'][np.arange(n_cols), s['col']['types']] = 1
        col_feats['coef_normalized'] = s['col']['coefs'].reshape(-1, 1) / obj_norm

    col_feats['has_lb'] = ~np.isnan(s['col']['lbs']).reshape(-1, 1)
    col_feats['has_ub'] = ~np.isnan(s['col']['ubs']).reshape(-1, 1)
    
    col_feats['sol_is_at_lb'] = s['col']['sol_is_at_lb'].reshape(-1, 1)
    col_feats['sol_is_at_ub'] = s['col']['sol_is_at_ub'].reshape(-1, 1)
    col_feats['sol_frac'] = s['col']['solfracs'].reshape(-1, 1)
    col_feats['sol_frac'][s['col']['types'] == 3] = 0  # continuous have no fractionality
    col_feats['basis_status'] = np.zeros((n_cols, 4))  # LOWER BASIC UPPER ZERO
    col_feats['basis_status'][np.arange(n_cols), s['col']['basestats']] = 1
    col_feats['reduced_cost'] = s['col']['redcosts'].reshape(-1, 1) / obj_norm
    col_feats['age'] = s['col']['ages'].reshape(-1, 1) / (s['stats']['nlps'] + 5)
    col_feats['sol_val'] = s['col']['solvals'].reshape(-1, 1)
    col_feats['inc_val'] = s['col']['incvals'].reshape(-1, 1)
    col_feats['avg_inc_val'] = s['col']['avgincvals'].reshape(-1, 1)


    # print("col_feats.key():",col_feats.keys())
    # for key in col_feats.keys():
    #     print("col_feats.",key,".shape:",col_feats[key].shape)

    #keys:'type', 'coef_normalized', 'has_lb', 'has_ub', 'sol_is_at_lb', 'sol_is_at_ub', 'sol_frac', 'basis_status', 'reduced_cost', 'age', 'sol_val', 'inc_val', 'avg_inc_val']
    # 4  col_feats. type .shape: (1000, 4)
    # 5  col_feats. coef_normalized .shape: (1000, 1)
    # 6  col_feats. has_lb .shape: (1000, 1)
    # 7  col_feats. has_ub .shape: (1000, 1)
    # 8  col_feats. sol_is_at_lb .shape: (1000, 1)
    # 9  col_feats. sol_is_at_ub .shape: (1000, 1)
    # 10 col_feats. sol_frac .shape: (1000, 1)
    # 14 col_feats. basis_status .shape: (1000, 4)
    # 15 col_feats. reduced_cost .shape: (1000, 1)
    # 16 col_feats. age .shape: (1000, 1)
    # 17 col_feats. sol_val .shape: (1000, 1)
    # 18 col_feats. inc_val .shape: (1000, 1)
    # 19 col_feats. avg_inc_val .shape: (1000, 1)
    



    col_feat_names = [[k, ] if v.shape[1] == 1 else [f'{k}_{i}' for i in range(v.shape[1])] for k, v in col_feats.items()]
    col_feat_names = [n for names in col_feat_names for n in names]
    col_feat_vals = np.concatenate(list(col_feats.values()), axis=-1)
    # col_feat_vals.shape : 1000,19

    variable_features = {
        'names': col_feat_names,
        'values': col_feat_vals,}

    # 行的功能 -> 约束特征
    # Row features

    if 'state' in buffer:
        row_feats = buffer['state']['row_feats']
        has_lhs = buffer['state']['has_lhs']
        has_rhs = buffer['state']['has_rhs']
    else:
        row_feats = {}
        has_lhs = np.nonzero(~np.isnan(s['row']['lhss']))[0]
        has_rhs = np.nonzero(~np.isnan(s['row']['rhss']))[0]

        row_feats['obj_cosine_similarity'] = np.concatenate((
            -s['row']['objcossims'][has_lhs],
            +s['row']['objcossims'][has_rhs])).reshape(-1, 1)
        
        row_feats['bias'] = np.concatenate((
            -(s['row']['lhss'] / row_norms)[has_lhs],
            +(s['row']['rhss'] / row_norms)[has_rhs])).reshape(-1, 1)

    row_feats['is_tight'] = np.concatenate((
        s['row']['is_at_lhs'][has_lhs],
        s['row']['is_at_rhs'][has_rhs])).reshape(-1, 1)

    row_feats['age'] = np.concatenate((
        s['row']['ages'][has_lhs],
        s['row']['ages'][has_rhs])).reshape(-1, 1) / (s['stats']['nlps'] + 5)

    # todo: check whether this change helps
    tmp = s['row']['dualsols'] / (row_norms * obj_norm)
    # tmp = s['row']['dualsols'] * row_norms / obj_norm
    row_feats['dualsol_val_normalized'] = np.concatenate((
            -tmp[has_lhs],
            +tmp[has_rhs])).reshape(-1, 1)


    # print("row_feats.key():",row_feats.keys())
    # for key in row_feats.keys():
    #     print("row_feats.",key,".shape:",row_feats[key].shape)

    # key(): dict_keys(['obj_cosine_similarity', 'bias', 'is_tight', 'age', 'dualsol_val_normalized'])
    # row_feats. obj_cosine_similarity .shape: (520, 1)
    # row_feats. bias .shape: (520, 1)
    # row_feats. is_tight .shape: (520, 1)
    # row_feats. age .shape: (520, 1)
    # row_feats. dualsol_val_normalized .shape: (520, 1)


    row_feat_names = [[k, ] if v.shape[1] == 1 else [f'{k}_{i}' for i in range(v.shape[1])] for k, v in row_feats.items()]
    row_feat_names = [n for names in row_feat_names for n in names]
    row_feat_vals = np.concatenate(list(row_feats.values()), axis=-1)




    constraint_features = {
        'names': row_feat_names,
        'values': row_feat_vals,}

    # 边特征
    # Edge features
    if 'state' in buffer:
        edge_row_idxs = buffer['state']['edge_row_idxs']
        edge_col_idxs = buffer['state']['edge_col_idxs']
        edge_feats = buffer['state']['edge_feats']
    else:
        # 权重/范数
        coef_matrix = sp.csr_matrix(
            (s['nzrcoef']['vals'] / row_norms[s['nzrcoef']['rowidxs']],
            (s['nzrcoef']['rowidxs'], s['nzrcoef']['colidxs'])),
            shape=(len(s['row']['nnzrs']), len(s['col']['types'])))
        coef_matrix = sp.vstack((
            -coef_matrix[has_lhs, :],
            coef_matrix[has_rhs, :])).tocoo(copy=False)

        edge_row_idxs, edge_col_idxs = coef_matrix.row, coef_matrix.col
        edge_feats = {}

        edge_feats['coef_normalized'] = coef_matrix.data.reshape(-1, 1)

    edge_feat_names = [[k, ] if v.shape[1] == 1 else [f'{k}_{i}' for i in range(v.shape[1])] for k, v in edge_feats.items()]
    edge_feat_names = [n for names in edge_feat_names for n in names]
    edge_feat_indices = np.vstack([edge_row_idxs, edge_col_idxs])
    edge_feat_vals = np.concatenate(list(edge_feats.values()), axis=-1)

    # print("edge_feats.key():",edge_feats.keys())
    # for key in edge_feats.keys():
    #     print("edge_feats.",key,".shape:",edge_feats[key].shape)
    
    # edge_feats.key(): dict_keys(['coef_normalized'])
    # edge_feats. coef_normalized .shape: (34861, 1)
    
    # edge_feat_vals.shape:(34861, 1)

    edge_features = {
        'names': edge_feat_names,
        'indices': edge_feat_indices,
        'values': edge_feat_vals,}

    if 'state' not in buffer:
        buffer['state'] = {
            'obj_norm': obj_norm,
            'col_feats': col_feats,
            'row_feats': row_feats,
            'has_lhs': has_lhs,
            'has_rhs': has_rhs,
            'edge_row_idxs': edge_row_idxs,
            'edge_col_idxs': edge_col_idxs,
            'edge_feats': edge_feats,
        }

    print(f"@@@@@@@@@@@@@@@@ baseline getState fun time:{time.time()-time_start_get_start}")

    return constraint_features, edge_features, variable_features


def graph_transform_new_37_base(state_base):
    """Convert an extracted bipartite state into a DGL heterograph.

    Parameters
    ----------
    state_base : dict
        Mapping with the keys ``'constraint_features'``, ``'edge_features'``
        and ``'variable_features'``. ``edge_features['indices']`` is indexed
        as a ``2 x n_edges`` array whose first row holds constraint indices
        and second row holds variable indices.

    Returns
    -------
    dgl.DGLHeteroGraph
        Graph with node types ``'c'`` and ``'v'`` and edge types ``'v2c'`` /
        ``'c2v'``; all node and edge features are stored under the key
        ``'h'``.

    Notes
    -----
    The previous body read an undefined name ``state`` instead of the
    ``state_base`` parameter; the parameter is now unpacked by key, in the
    same way as ``graph_transform_new_37_all`` does.
    """
    constraint_features = state_base["constraint_features"]
    edge_features = state_base["edge_features"]
    variable_features = state_base["variable_features"]

    idx = edge_features['indices']
    # Make sure that the feature shape matches the graph: the same edge list
    # is used in both directions, with source/target swapped.
    v2c_index = (idx[1, :], idx[0, :])
    c2v_index = (idx[0, :], idx[1, :])

    # Edge, constraint and variable feature tensors.
    edge_feats = torch.tensor(edge_features['values'], dtype=torch.float).view(-1, 1)
    c_feats = torch.tensor(constraint_features['values'], dtype=torch.float)
    # Only the first 17 variable feature columns are kept.
    v_feats = torch.tensor(variable_features['values'][:, :17], dtype=torch.float)
    # Node counts per node type.
    num_nodes_dict = {'c': c_feats.shape[0], 'v': v_feats.shape[0]}

    # A heterograph is made of one sub-graph per relation; each relation is a
    # (source node type, edge type, target node type) string triple.
    graph = dgl.heterograph({
        ('v', 'v2c', 'c'): v2c_index,
        ('c', 'c2v', 'v'): c2v_index,
    }, num_nodes_dict)

    # Attach the features to the graph.
    graph.edges['v2c'].data['h'] = edge_feats
    graph.edges['c2v'].data['h'] = edge_feats
    graph.nodes['v'].data['h'] = v_feats
    graph.nodes['c'].data['h'] = c_feats

    return graph

def graph_transform_new_37_all(state_all):
    """Turn an extracted candidate state into a DGL heterograph.

    Parameters
    ----------
    state_all : dict
        Mapping with the keys ``'constraint_features'``, ``'edge_features'``
        and ``'variable_features'``. ``edge_features['indices']`` is indexed
        as a ``2 x n_edges`` array whose first row holds constraint indices
        and second row holds variable indices.

    Returns
    -------
    dgl.DGLHeteroGraph
        Graph with node types ``'c'`` and ``'v'`` and edge types ``'v2c'`` /
        ``'c2v'``; all node and edge features are stored under the key
        ``'h'``.
    """
    cons_part = state_all["constraint_features"]
    edge_part = state_all["edge_features"]
    var_part = state_all["variable_features"]

    # Row 0 of the index array: constraint ids; row 1: variable ids.
    pairs = edge_part['indices']
    cons_ids = pairs[0, :]
    var_ids = pairs[1, :]

    # Feature tensors; only the first 17 variable feature columns are kept.
    edge_tensor = torch.tensor(edge_part['values'], dtype=torch.float).view(-1, 1)
    cons_tensor = torch.tensor(cons_part['values'], dtype=torch.float)
    var_tensor = torch.tensor(var_part['values'][:, :17], dtype=torch.float)

    node_counts = {'c': cons_tensor.shape[0], 'v': var_tensor.shape[0]}

    # One relation per direction, each given as a
    # (source node type, edge type, target node type) triple.
    relations = {
        ('v', 'v2c', 'c'): (var_ids, cons_ids),
        ('c', 'c2v', 'v'): (cons_ids, var_ids),
    }
    graph = dgl.heterograph(relations, node_counts)

    # The same edge feature tensor is attached to both directions.
    for edge_type in ('v2c', 'c2v'):
        graph.edges[edge_type].data['h'] = edge_tensor
    graph.nodes['v'].data['h'] = var_tensor
    graph.nodes['c'].data['h'] = cons_tensor

    return graph

# Load branching samples
class BranchDataset_new_37(Dataset):
    """In-memory dataset of branching samples stored as gzip-compressed pickles.

    Every file is expected to unpickle to a mapping whose ``'data'`` entry is a
    7-tuple ``(root_state_base, state_base, state_cands_col, state_cands_all,
    bestcand, action_set, scores)``.

    Each stored item is the reordered tuple ``(root_state_base, state_base,
    state_cands_col, state_cands_all, candidates, label, scores)`` where
    ``candidates`` is ``action_set`` and ``label`` is ``bestcand``.
    """

    def __init__(self, dirs):
        """Eagerly load every sample file.

        Args:
            dirs: iterable of paths to gzip-compressed pickle files.

        Raises:
            OSError: if a file cannot be opened or read.
            KeyError: if an unpickled object has no ``'data'`` entry.
            ValueError: if a sample does not unpack into seven fields.
        """
        super().__init__()
        self.data = []
        for path in dirs:
            # NOTE(security): unpickling can execute arbitrary code; only load
            # sample files that come from a trusted source.
            # The context manager closes the gzip handle deterministically
            # instead of leaving one open file per sample to the GC.
            with gzip.open(path, 'rb') as sample_file:
                sample = pickle.load(sample_file)['data']
            (root_state_base, state_base, state_cands_col, state_cands_all,
             bestcand, action_set, scores) = sample

            label = bestcand
            candidates = action_set
            self.data.append((root_state_base, state_base, state_cands_col,
                              state_cands_all, candidates, label, scores))

    def __len__(self):
        """Return the number of loaded samples."""
        return len(self.data)

    def __getitem__(self, idx):
        """Return the stored sample tuple at position ``idx``."""
        return self.data[idx]

# Collate dataset samples into one batched DGL graph plus labels.
def dgl_collate_new_37(batch):
    """Merge a list of dataset samples into a single training batch.

    Args:
        batch: sequence of 7-tuples ``(root_state_base, state_base,
            state_cands_col, state_cands_all, candidates, label, scores)``.

    Returns:
        ``(root_index, root_bg, bg, candidates, label, scores)`` where ``bg``
        is the batched graph built from every sample's ``state_cands_all``,
        ``label`` is a ``torch.LongTensor`` and ``candidates`` / ``scores``
        are plain per-sample lists. ``root_index`` is always an empty list and
        ``root_bg`` is always ``None``.
    """
    # Transpose the batch: one list per sample field.
    columns = [list(field) for field in zip(*batch)]
    _root_states, _states, _cand_cols, state_cands_all, candidates, label, scores = columns

    # Root-graph batching and root-index construction are disabled; the
    # placeholders below keep the shape of the returned tuple stable.
    root_bg = None
    root_index = []

    bg = dgl.batch([graph_transform_new_37_all(full_state) for full_state in state_cands_all])

    label = torch.LongTensor(label)

    return root_index, root_bg, bg, candidates, label, scores


def train_new_37(args, root_model, model, trainData, optimizer, epoch, log_interval, device):
    """Train ``model`` for one pass over ``trainData``.

    Args:
        args: accepted but not used in this function.
        root_model: accepted but not used in this function.
        model: network exposing ``forword_all(batched_graph)``; the returned
            graph is read at ``nodes['v'].data['s']``.
        trainData: iterable of batches shaped like
            ``(root_index, root_bg, bg, candidates, label, scores)``; it must
            support ``len()`` for progress logging.
        optimizer: optimizer stepped once per batch.
        epoch: zero-based epoch number (logged as ``epoch + 1``).
        log_interval: a progress line is logged every this many batches.
        device: device the batched graph and the labels are moved to.

    Returns:
        None. Running loss and accuracies are only written to the logger.
    """
    model.train()
    loss_sum = 0.0
    seen = 0.0
    soft_hits = 0.0
    hard_hits = 0.0

    for step, batch in enumerate(trainData, start=1):
        root_index, root_bg, bg, candidates, label, scores = batch

        optimizer.zero_grad()
        bg = bg.to(device)
        label = label.to(device)
        count = len(label)
        seen += count

        bg = model.forword_all(bg)

        # One score tensor per sample graph.
        # presumably shaped (num_v_nodes, 1) so that .T is a single row of
        # class scores — TODO confirm against the model.
        logits = [g.nodes['v'].data['s'] for g in dgl.unbatch(bg)]
        sample_ids = range(count)
        pred = [logits[i].argmax(dim=0) for i in sample_ids]

        # "Hard" hit: the predicted entry of `candidates` equals the label.
        hard_hits += sum(candidates[i][pred[i]] == label[i] for i in sample_ids).item()
        # "Soft" hit: the predicted entry attains the sample's maximum score.
        soft_hits += sum(scores[i][pred[i]] == max(scores[i]) for i in sample_ids)

        # Mean of the per-sample cross-entropy losses in this batch.
        loss = sum(F.cross_entropy(logits[i].T, label[i:i+1]) for i in sample_ids) / count

        loss.backward()
        optimizer.step()
        # Weight by batch size so loss_sum / seen is a per-sample average.
        loss_sum += loss.item() * count

        if step % log_interval != 0:
            continue
        n_batches = len(trainData)
        logger.info('Train epoch {}:\t [{}/{}({:.0f}%)]\tTrain Loss: {:.6f}\t Accuracy: {:.6f}\t Hard Accuracy: {:.6f}'.format(
            epoch + 1, step, n_batches, 100. * step / n_batches, loss_sum / seen,
            soft_hits / seen, hard_hits / seen))


def test_new_37(args, root_model, model, testData, optimizer, epoch, device):
    """Evaluate ``model`` on ``testData`` without computing gradients.

    Args:
        args: accepted but not used in this function.
        root_model: accepted but not used in this function.
        model: network exposing ``forword_all(batched_graph)``; the returned
            graph is read at ``nodes['v'].data['s']``.
        testData: iterable of batches shaped like
            ``(root_index, root_bg, bg, candidates, label, scores)``.
        optimizer: only ``zero_grad()`` is called on it, once per batch.
        epoch: zero-based epoch number (logged as ``epoch + 1``).
        device: device the batched graph and the labels are moved to.

    Returns:
        ``(loss, accuracy, hard_acc)``: the per-sample average loss, the
        fraction of predictions that attain the sample's maximum score, and
        the fraction whose ``candidates`` entry equals the label.

    Raises:
        ZeroDivisionError: if ``testData`` yields no samples.
    """
    model.eval()
    loss_sum = 0
    soft_hits = 0
    seen = 0
    hard_hits = 0

    with torch.no_grad():
        for batch in testData:
            root_index, root_bg, bg, candidates, label, scores = batch

            # NOTE(review): no backward pass happens in this loop; the call is
            # kept so that the optimizer side effect stays as before.
            optimizer.zero_grad()
            bg = bg.to(device)
            label = label.to(device)
            count = len(label)
            seen += count

            bg = model.forword_all(bg)

            # One score tensor per sample graph.
            logits = [g.nodes['v'].data['s'] for g in dgl.unbatch(bg)]
            sample_ids = range(count)

            pred = [logits[i].argmax(dim=0) for i in sample_ids]
            # "Hard" hit: the predicted entry of `candidates` equals the label.
            hard_hits += sum(candidates[i][pred[i]] == label[i] for i in sample_ids).item()
            # "Soft" hit: the predicted entry attains the sample's maximum score.
            soft_hits += sum(scores[i][pred[i]] == max(scores[i]) for i in sample_ids)

            # Mean of the per-sample cross-entropy losses in this batch.
            loss = sum(F.cross_entropy(logits[i].T, label[i:i + 1]) for i in sample_ids) / count

            # Weight by batch size so the final ratio is a per-sample average.
            loss_sum += loss.item() * count

    loss = loss_sum / seen
    accuracy = soft_hits / seen
    hard_acc = hard_hits / seen
    logger.info('Test epoch {}:\t Test Loss: {:.6f}\t Accuracy: {:.6f}\t Hard Accuracy: {:.6f}'.format(epoch + 1, loss, accuracy, hard_acc))
    return loss, accuracy, hard_acc
