[build-system]
requires = ["setuptools>=61", "wheel"]
build-backend = "setuptools.backends.legacy:build"

[project]
name = "meta-rg-s2b"
version = "0.1.0"
description = "Minimal reproduction of Section 4.4 (Table 4) from 'Meta-Referential Games to Learn Compositional Learning Behaviours'"
readme = "README.md"
requires-python = ">=3.10"
license = { text = "MIT" }

dependencies = [
    # S2B environment — install via: pip install -e path/to/SymbolicBehaviourBenchmark
    "symbolic-behaviour-benchmark",
    # RL / gym
    "gym>=0.21,<0.24",
    "numpy>=1.24",
    # HuggingFace stack (local HF and GRPO backends)
    "torch>=2.0",
    "transformers>=4.40",
    "accelerate>=0.27",
    "peft>=0.10",          # LoRA — required for GRPO training
    # Logging / tracking
    "tqdm",
    "wandb",
    "pyyaml",
]

[project.optional-dependencies]
cot    = ["dspy>=3.0"]
openai = ["openai>=1.0"]
vllm   = ["vllm>=0.4"]
llamacpp = ["llama-cpp-python>=0.2"]
bitsandbytes = ["bitsandbytes>=0.43"]   # 4-bit quantisation
weave  = ["weave"]                       # W&B Weave LLM call tracing
dev    = ["pytest>=7", "pytest-cov"]
all    = [
    "dspy>=3.0",
    "openai>=1.0",
    "vllm>=0.4",
    "llama-cpp-python>=0.2",
    "bitsandbytes>=0.43",
    "weave",
]

[tool.setuptools.packages.find]
where = ["."]
include = ["meta_rg*"]

[tool.pytest.ini_options]
testpaths = ["tests"]
markers = [
    "integration: tests that hit external APIs (require HF_TOKEN or similar credentials)",
]
