
import pandas as pd
import json
import numpy as np
from omegaconf import OmegaConf, DictConfig
import os
import yaml
from template_bash import bash_heads
from tqdm import tqdm
import glob
import shutil

df = pd.read_parquet('/path/to/data/csv')
captions = df['caption']
df_animal = df[~df['Animal'].isin(['None', None])]
vid_path = '/path/to/source/video/mp4'
frame_path = '/path/to/source/video/frames'

captions = list(df_animal['caption'])
prompts = list(df_animal['CE_animal'])
keys = list(df_animal['key'])
animals = list(df_animal['Animal'])
animals = [item.split(', ') for item in animals]
editing_entity = list(df_animal['CE_animal_editing_entity'])
video_files = [os.path.join(vid_path, f'{key}.mp4') for key in keys]
frame_files = [os.path.join(frame_path, key) for key in keys]
prompt_bashes = []

for i in range(len(video_files)):
    cur_bash = f"python -u inference.py --device $$$d$$$ --video_path {video_files[i]} --prompt '{prompts[i]}' --output_path 'results/{keys[i]}/{keys[i]}.mp4'"
    prompt_bashes.append(cur_bash)
devide_count = 2
total_len = len(prompt_bashes)
length_per_device = total_len // devide_count
run_string = bash_heads['text2video']

for i in range(devide_count):
    new_list = []
    start = i * length_per_device
    # 对最后一部分进行特别处理，将剩余的部分都留给最后一个device
    end = (i+1) * length_per_device if i != (devide_count-1) else total_len
    for j in range(start, end):
        # 在每个命令字符串后面添加相应的设备id
        new_list.append(prompt_bashes[j].replace('$$$d$$$', str(i)))
    with open(f'run_ce_animals_text2video_p{i}.sh', 'w') as s:
        s.write(run_string + '\n')
        s.write('\n\n'.join(new_list))
        s.close()