import sys
import best3 as b3
from constants import imdb_dir
import torch as th
import vllm
import polars as pl
if __name__ == '__main__':
    # Script entry point: for every movie id given on the command line, print
    # its rows from the alternatives table, its stored URL and its formatted
    # IMDb page, then embed the formatted text and collect the embeddings.

    # Parse the ids up front so a malformed argument fails before the
    # embedding model is loaded rather than midway through the loop.
    movie_ids = [int(arg) for arg in sys.argv[1:]]

    model = vllm.LLM("intfloat/e5-mistral-7b-instruct", task="embed")
    embed = []
    df = pl.DataFrame.deserialize('datasets/nf/alternatives.pl')
    for i in movie_ids:
        print('-------------------------------', i)
        # Select rows with `filter`; indexing a polars DataFrame with a
        # boolean mask (`df[mask]`) is not a supported way to pick rows.
        print(df.filter(pl.col('movie') == i))
        ip = imdb_dir / b3.movie_fn(i)
        with open(ip / "url.txt") as fd:
            print(fd.read())

        with open(ip / "imdb.html") as fd:
            inp = b3.format_imdb(fd.read())
        print(inp)
        # A single prompt is submitted, so the first result carries its
        # embedding.
        embed.append(model.embed(inp)[0].outputs.embedding)
    # Convert the collected per-movie embeddings into one tensor.
    embed = th.tensor(embed)