import os
import subprocess


def run_extraction(input_dir, output_dir, vocab_file, bert_config_file, init_checkpoint, layers, max_seq_length,
                   batch_size, use_gpu):
    # 确保输出目录存在
    if not os.path.exists(output_dir):
        os.makedirs(output_dir)

    # 遍历input_dir中的所有文件
    for filename in os.listdir(input_dir):
        # if filename.endswith(".txt"):  # 确保处理.txt文件
        if filename != "all.txt":
            input_file = os.path.join(input_dir, filename)
            output_file = os.path.join(output_dir, filename[:-4] + ".json")

            if os.path.exists(output_file):
                continue
            else:
                print("input file name is " + input_file)
                print("out put file is "+output_file)
                command = [
                    "python3", "extract_features.py",
                    "--input_file", input_file,
                    "--output_file", output_file,
                    "--vocab_file", vocab_file,
                    "--bert_config_file", bert_config_file,
                    "--init_checkpoint", init_checkpoint,
                    "--layers", str(layers),
                    "--max_seq_length", str(max_seq_length),
                    "--batch_size", str(batch_size),
                    "--use_gpu", str(use_gpu)
                ]

                # 执行命令
                print("Processing file:", filename)
                print("-----------------------------command: ", command)
                subprocess.run(command)


# 配置参数
input_dir = './feature/input/reentrancy'
output_dir = './feature/output/reentrancy'
vocab_file = './vocab.txt'
bert_config_file = './bert_config.json'
init_checkpoint = './models/finetune/tfrecord/reentrancy/model.ckpt-4812'
layers = -1
max_seq_length = 64
batch_size = 8
use_gpu = 'True'

# 运行函数
run_extraction(input_dir, output_dir, vocab_file, bert_config_file, init_checkpoint, layers, max_seq_length, batch_size,
               use_gpu)
