import os
import json

all_type = []
def flatten_list(nested_list):
    flat_list = []
    for item in nested_list:
        if isinstance(item, list):
            flat_list.extend(flatten_list(item))  # 递归处理嵌套列表
        else:
            flat_list.append(item)
    return flat_list


def extract_expression_types(expression, types):
    if expression:
        types.append(expression.get('type'))
        return extract_expression_types(expression.get('expression'), types)


def process_json_file(input_filepath, output_filepath, y):
    global all_type
    with open(input_filepath, 'r', encoding='utf-8') as f:
        input_json = json.load(f)

    input_json_children = input_json['children']
    if len(input_json_children) == 1:
        children = input_json_children[0]
    else:
        children = input_json['children'][1]

    # contract = {
    #     'name': children['name'],
    #     'type': children['type'],
    #     'kind': children['kind'],
    #     'subnode_num': len(children['subNodes']),
    #     'sub_node_info': [],
    #     'sub_node_visibility': []
    # }
    contract = {
        'name': children.get('name', 0),
        'type': children.get('type', 0),
        'kind': children.get('kind', 0),
        'subnode_num': len(children.get('subNodes', [])),
        'sub_node_info': [],
        'sub_node_visibility': [],
        "y": y
    }

    # all_type.extend(children['type'])
    # all_type.extend(children['kind'])
    if 'type' in children:
        all_type .append(str(children['type']))
        print("children['type'],", children['type'])

    if 'kind' in children:
        all_type .append(str(children['kind']))
        print("children['kind']", children['kind'])

    if 'subNodes' in children and children['subNodes'] is not None:
        for node in children['subNodes']:
            sub_node = {
                "node_is_function": 0,
                "node_parameters": 0,
                "node_return_parameters": 0,
                "node_is_constructor": 0,
                "node_is_variable": 0,
                "node_variable_has_number": 0,
                'sub_body_type': [],
                'node_type': node['type']
            }

            # if 'variables' in node:
            #     sub_node['node_body_type'] = node['variables'][0]['type']
            #     sub_node['node_is_variable'] = 1
            #     if 'visibility' in node['variables'][0]:
            #         contract['sub_node_visibility'].append(node['variables'][0]['visibility'])
            #     if ('expression' in node['variables'][0]) and (node['variables'][0]['expression'] is not None) and (
            #             'number' in node['variables'][0]['expression']):
            #         sub_node['node_variable_has_number'] = 1
            # else:
            #     sub_node['node_body_type'] = node['body']['type']
            #     sub_node['node_is_function'] = 1
            if 'variables' in node:
                if len(node['variables']) > 0:  # Check if 'variables' list is not empty
                    sub_node['node_body_type'] = node['variables'][0]['type']
                    sub_node['node_is_variable'] = 1
                    if 'visibility' in node['variables'][0]:
                        contract['sub_node_visibility'].append(node['variables'][0]['visibility'])
                    if 'expression' in node['variables'][0] and node['variables'][0]['expression'] is not None:
                        if 'number' in node['variables'][0]['expression']:
                            sub_node['node_variable_has_number'] = 1
            else:
                if 'body' in node and node['body'] is not None and 'type' in node['body']:
                    sub_node['node_body_type'] = node['body']['type']
                    sub_node['node_is_function'] = 1

            if 'parameters' in node and node['parameters'] is not None:
                sub_node['node_parameters'] = 1

            if 'returnParameters' in node and node['returnParameters'] is not None:
                sub_node['node_return_parameters'] = 1

            if 'isConstructor' in node and node['isConstructor'] is not None:
                sub_node['node_is_constructor'] = 1

            # if 'body' in node and 'statements' in node['body']:
            #     sub_body = node['body']['statements'][0]
            #     sub_node['sub_body_type'].append(sub_body['type'])
            #     extract_expression_types(sub_body.get('expression'), sub_node['sub_body_type'])

            if 'body' in node and node['body'] is not None and 'statements' in node['body']:
                statements = node['body']['statements']
                if len(statements) > 0:
                    sub_body = statements[0]
                    sub_node['sub_body_type'].append(sub_body['type'])
                    if 'expression' in sub_body:
                        extract_expression_types(sub_body['expression'], sub_node['sub_body_type'])

            contract['sub_node_info'].append(sub_node)

            if len(sub_node['node_type']) > 0:
                all_type .append(sub_node['node_type'])
            if len(contract['sub_node_info']) > 0:
                all_type .append(sub_node['sub_body_type'])

            print("sub_node['node_type'],", sub_node['node_type'])
            print("sub_node['sub_body_type']", sub_node['sub_body_type'])

        if not os.path.exists(output_filepath):
            with open(output_filepath, 'w', encoding='utf-8') as f:
                json.dump(contract, f, ensure_ascii=False)


def process_all_json_files(input_directory, output_directory):
    if not os.path.exists(output_directory):
        os.makedirs(output_directory)

    for filename in os.listdir(input_directory):
        if filename.endswith('.json'):
            input_filepath = os.path.join(input_directory, filename)
            output_filepath = os.path.join(output_directory, filename)
            if 299 <= int(filename[:-5]) and int(filename[:-5]) <= 1060:
                y = 1
            else:
                y = 0
            process_json_file(input_filepath, output_filepath, y)


# Specify the input and output directories
input_directory = r'E:\2024\experiment_code_clone\total4\source_code_no_comments\ast'
output_directory = r'E:\2024\experiment_code_clone\total4\source_code_no_comments\processed_ast'
feature_folder = r'E:\2024\experiment_code_clone\total4\source_code_no_comments\ast2features'

# Process all JSON files
process_all_json_files(input_directory, output_directory)

# flattened_list=all_type
flattened_list = flatten_list(all_type)
flattened_list=list(set(flattened_list))

with open(os.path.join(feature_folder, 'all_type.json'), 'w', encoding='utf-8') as f:
    json.dump(flattened_list, f, ensure_ascii=False)
