import json

# 读取 JSON 文件
train_file = './external_call/train.json'
with open(train_file, 'r') as f:
    data = json.load(f)

# 用于存储保留下来的智能合约数据
filtered_data = []

# 遍历每个智能合约的数据
for contract_data in data:
    # 获取 graph 数据
    graph = contract_data['graph']

    # 计算每个子元素的第一个和第三个最大值 len_graph
    len_graph = [max(subgraph[0], subgraph[2]) for subgraph in graph]
    max_len = max(len_graph)

    # 检查 node_features
    node_features = contract_data['node_features']
    cleaned_node_features = []
    cleaned_graph_features = []
    for feature in node_features:
        # 如果该子元素中的元素全为0，则跳过
        if not all(x == 0 for x in feature):
            cleaned_node_features.append(feature)
    for feature in graph:
        cleaned_graph_features.append(feature)
    len_node_features = len(cleaned_node_features)

    diff = max_len - len_node_features + 1
    if diff > 0:
        for _ in range(diff):
            cleaned_node_features.append([0] * 64)
    elif diff < 0:
        diff = abs(diff)
        for _ in range(diff):
            cleaned_graph_features.append([0] * 3)

    new_max = [max(subgraph[0], subgraph[2]) for subgraph in cleaned_graph_features]
    new_node_featuers=len(cleaned_graph_features)
    new_diff= new_max - new_node_featuers + 1

    if new_diff>0:
        for _ in range(diff):
            cleaned_node_features.append([0] * 64)
    elif diff < 0:
        diff = abs(diff)
        for _ in range(diff):
            cleaned_graph_features.append([0] * 3)

    contract_data['node_features'] = cleaned_node_features
    contract_data['graph'] = cleaned_graph_features

    filtered_data.append(contract_data)

# 将处理后的数据写回 JSON 文件
with open(train_file, 'w') as m:
    m.write('[')
    for idx, data in enumerate(filtered_data):
        json.dump(data, m)
        if idx < len(filtered_data) - 1:
            m.write(',\n')  # Add a comma and newline after writing each item
    # m.write(',\n')
    m.write(']')
