from wrapper import PENGIWrapper

# Build the wrapper. The angle-bracket strings in this script appear to be
# placeholders to be replaced with real paths before running.
pengi = PENGIWrapper(model_path="<model_path>")

# Run a single prediction and unpack the two values it returns.
# NOTE(review): the keyword `tast_context` is kept exactly as written; it may
# be a typo for `task_context` -- confirm against the signature of
# PENGIWrapper.predict before renaming it.
# The remaining keywords are presumably text-decoding settings; verify their
# meaning against the wrapper implementation.
generated_captions, scores = pengi.predict(
    audio_path="<audio_file_path>",
    tast_context="generate metadata",
    context="",
    entry_length=30,
    beam_size=3,
    temperature=1.0,
    stop_token=" <|endoftext|>",
)