# Core package metadata read by Poetry.
[tool.poetry]
name = "judges-verdict"
version = "0.1.0"
description = "Judge's Verdict: A comprehensive system for evaluating Large Language Models as judges"
readme = "README.md"
# The distribution is published as "judges-verdict", while the importable
# package shipped in it is the "llm_judge_benchmark" directory.
packages = [
    { include = "llm_judge_benchmark" },
]

# Runtime requirements. Every third-party package uses a tilde constraint,
# which accepts newer patch releases but not the next minor release.
[tool.poetry.dependencies]
# Interpreter range supported by the project.
python = ">=3.12,<4.0"
# Third-party packages, sorted alphabetically.
datasets = "~4.0.0"
langchain_nvidia_ai_endpoints = "~0.3.17"
langchain_openai = "~0.3.32"
litellm = "~1.76.2"
pandas = "~2.3.2"
pyyaml = "~6.0.2"
ragas = "~0.3.3"
tqdm = "~4.67.1"

# Development-only tooling (formatting, linting, type checking, testing);
# declared in the "dev" dependency group rather than as runtime requirements.
# Sorted alphabetically.
[tool.poetry.group.dev.dependencies]
black = "~25.1.0"
flake8 = "~7.3.0"
isort = "~6.0.1"
mypy = "~1.17.1"
pytest = "~8.4.2"
pytest-cov = "~6.2.1"
# Type stubs for PyYAML, used by mypy.
types-pyyaml = "~6.0.12.20250822"

# Console entry points created on install: the `llm-judge-score` command
# invokes `main` in the module `llm_judge_benchmark.scoring.llm_judge_scoring`.
[tool.poetry.scripts]
llm-judge-score = "llm_judge_benchmark.scoring.llm_judge_scoring:main"

# PEP 517 build configuration: the package is built with Poetry's
# standalone build backend.
[build-system]
# Lower bound so isolated builds never resolve a pre-1.0 poetry-core release.
requires = ["poetry-core>=1.0.0"]
build-backend = "poetry.core.masonry.api"

# Code formatter settings.
[tool.black]
line-length = 120
target-version = ["py312"]
# Regex searched against each root-relative path (directories carry a
# trailing "/"). Names are wrapped in "/.../" so only whole directory names
# match, and dots are escaped so they are literal; an unanchored pattern such
# as "dist" or "tools" would also skip files like "distance.py" or
# "my_tools.py". ".venv" is listed explicitly because the anchored "venv"
# entry no longer matches it as a substring.
exclude = '/(\.eggs|\.git|\.hg|\.mypy_cache|\.nox|\.tox|\.venv|venv|doc-venv|\.svn|_build|buck-out|build|dist|notebooks|tools|tmp|bundles)/'

# Import sorter settings, chosen so isort's wrapping style agrees with black.
[tool.isort]
# Same maximum line width as configured under [tool.black].
line_length = 120
# Mode 3 is "vertical hanging indent": one import per line inside parentheses.
multi_line_output = 3
use_parentheses = true
include_trailing_comma = true
# 0 = never force grid wrapping based on the number of imported names.
force_grid_wrap = 0
ensure_newline_before_comments = true

# Static type checker settings.
[tool.mypy]
# Do not report errors for imports whose stubs or sources cannot be found.
ignore_missing_imports = true
# Permit re-binding a variable to a value of a different type.
allow_redefinition = true
# Strict Optional checking is switched off: None is accepted for any type.
strict_optional = false
# Regex searched against relative paths found during recursive discovery
# (directories carry a trailing "/"). Anchoring with "(^|/)" and "/" limits
# matches to whole directory names, and dots are escaped so they are literal;
# an unanchored "tests" or "build" would also skip modules such as
# "tests_utils.py" or "builder.py". ".venv" is listed explicitly because the
# anchored "venv" entry no longer matches it as a substring.
exclude = '(^|/)(\.eggs|\.git|\.hg|\.mypy_cache|\.nox|\.tox|\.venv|venv|doc-venv|\.svn|_build|buck-out|build|dist|notebooks|tools|tmp|tests|bundles)/'
