import numpy as np
from transformers import AutoTokenizer
# Tokenizer for the "facebook/opt-125m" checkpoint; the script uses it to
# decode the entries of the loaded array back into text.
tokenizer = AutoTokenizer.from_pretrained("facebook/opt-125m")
import tqdm

# Load the array stored in 'opt_2000.npy' and decode it entry by entry into
# the list `test`.
# NOTE(review): each output[ind] is presumably a sequence of token ids -- confirm.
output = np.load('opt_2000.npy')
test = []
# The original hard-coded bound is kept as an upper cap, but the loop no longer
# runs past the end of the array: with a shorter array every surplus index used
# to raise IndexError, which was swallowed and printed once per missing index.
row_count = min(len(output), 40960000)
for ind in tqdm.tqdm(range(row_count)):
    try:
        text = tokenizer.decode(output[ind])
    except Exception as err:
        # Best-effort: report the failing index (and why) and move on.
        # Catching Exception rather than using a bare except lets
        # KeyboardInterrupt / SystemExit still stop the run.
        print(ind, repr(err))
        continue
    test.append(text)

# Write every decoded text to 'opt_2000.txt', each followed by a blank line.
# The encoding is set explicitly because decoded text may contain non-ASCII
# characters and the platform default encoding is not guaranteed to be UTF-8.
with open('opt_2000.txt', 'w', encoding='utf-8') as f:
    for txt in tqdm.tqdm(test):
        # One write per entry: the text, its newline, and the separator line.
        f.write(txt + '\n\n')