import numpy as np
import torch
import xgboost as xgb

def bin_features(graph, train_idx):
    features = graph.ndata['feature'].cpu().numpy()
    labels = graph.ndata['label'].cpu().numpy()

    dtrain = xgb.DMatrix(features[train_idx], label=labels[train_idx])
    params = {
        'max_depth': 14,
        'eta': 0.1,
        'objective': 'binary:logistic',
        'eval_metric': 'logloss',
    }
    num_round = 300
    bst = xgb.train(params, dtrain, num_boost_round=num_round)

    ddata = xgb.DMatrix(features)
    leaf_indices = bst.predict(ddata, pred_leaf=True)  # [N, num_trees]

    N, T = leaf_indices.shape
    bin_counts = []
    for j in range(T):
        max_leaf_id = int(np.max(leaf_indices[:, j]))
        bin_counts.append(max_leaf_id + 1)

    graph.ndata['binned_feature'] = torch.tensor(leaf_indices, dtype=torch.long)
    graph.ndata['label'] = graph.ndata['label'].float()
    return graph, bst, bin_counts
