# Python package dependencies for this project.
# Every entry is pinned to one exact version with `==`, so an install from this
# file resolves the same versions of these nine packages each time. Transitive
# dependencies are NOT pinned here.
#
# Install with: pip install -r <path to this file>
#
# Naming note: pip normalizes project names (case-insensitive; `_`, `-` and `.`
# are interchangeable), so `langchain_core` and `langchain-core` refer to the
# same distribution.
datasets==3.3.2
# NOTE(review): confirm this is the intended distribution. If the code base only
# imports a local `evaluation` module (or Hugging Face `evaluate`), this pin may
# be a mis-resolved name from an auto-generated requirements list and would
# install an unrelated package. Verify against the project's imports.
Evaluation==0.0.2
# The three langchain packages are released together; keep their versions
# mutually compatible when bumping any one of them.
langchain==0.3.26
langchain_core==0.3.69
langchain_openai==0.3.28
# NOTE(review): the numpy 2.3 series is believed to require Python >= 3.11 --
# confirm the project's supported interpreter versions before relying on this pin.
numpy==2.3.1
pydantic==2.11.7
ragas==0.2.15
rouge_score==0.1.2
