import outlines
# Filesystem location of the model checkpoint; passed to
# outlines.models.transformers() further down in this script.
# NOTE(review): machine-specific absolute path -- presumably a LoRA
# fine-tuned checkpoint judging by the directory name; confirm before reuse.
model_path = '/data/home/zhanghx/model/lora_model_answer'
from outlines import models, generate, samplers

# Load the checkpoint at `model_path` through outlines' transformers wrapper,
# placing it on CUDA device 0.
outlines_model = outlines.models.transformers(model_path, device="cuda:0")
# Debug aid (disabled): print the mean value of every parameter tensor.
# for name, param in outlines_model.model.named_parameters():
#     print(f"Layer: {name} | Mean: {param.mean().item()}")

# Sample input, embedded into the instruction prompt that asks the model to
# answer "Yes"/"No" depending on whether the input was seen in pre-training.
input_text = "how are you?"
text = f'''Below is an input may be from pre-training corpus. if the input is seen in the pre-training step, the answer is "Yes", otherwise, it is "No". Please provide an answer. 

### Input:
{input_text}
'''

# Deterministic decoding: always pick the highest-probability token.
# This replaces `samplers.multinomial(1, temperature=1e-10)`, which only
# approximated argmax by dividing the logits by a near-zero temperature; that
# division can overflow in reduced-precision logits and still goes through a
# random draw. `samplers.greedy()` is the library's dedicated sampler for this.
sampler = samplers.greedy()
generator = outlines.generate.text(outlines_model, sampler)

# Alternative (disabled): constrain the output to exactly "Yes" or "No".
# generator = outlines.generate.choice(outlines_model, ["Yes", "No"])

# Free-form generation, capped at 350 new tokens; the raw completion is printed.
answer = generator(text, max_tokens=350)
print(answer)



