# Mixtral-8x7B-Instruct-v0.1 via vLLM (offline in-process)
# Faster than Hugging Face (HF) inference for large-scale evaluation.
# Requires: pip install vllm
# Matches Table 4, Mixtral row.
# Label for this configuration (model + backend).
# NOTE(review): presumably used to tag run outputs — verify against the loader.
name: Mixtral-8x7B-vllm

# Task parameters.
# NOTE(review): the key names suggest a speaker/listener communication game
# (latents, distractors, vocabulary, rounds, listener feedback). The exact
# semantics are defined by the consuming code — confirm there before editing.
task:
  # Latent and distractor counts; 0 distractors here.
  nbr_latents: 3
  nbr_distractors: 0
  # Message-space limits.
  # NOTE(review): presumably the symbol-vocabulary size and the maximum
  # message length in symbols — TODO confirm units.
  vocab_size: 6
  max_sentence_length: 3
  # Lower/upper bound on the number of values per latent.
  # NOTE(review): whether the bounds are inclusive is not visible here.
  min_nbr_values_per_latent: 2
  max_nbr_values_per_latent: 5
  nbr_communication_rounds: 1
  # Boolean switches; their effect is defined by the consuming code.
  descriptive: true
  provide_listener_feedback: true

# Inference backend: vLLM in offline mode (in-process, per the file header).
# NOTE(review): these keys are presumably forwarded to vLLM's engine and
# sampling parameters — verify against the backend loader.
backend:
  backend_type: vllm
  mode: offline
  # Model identifier in Hugging Face Hub "org/name" form.
  model: mistralai/Mixtral-8x7B-Instruct-v0.1
  # Non-zero temperature implies sampled (non-greedy) decoding; no seed is set
  # in this block.
  # NOTE(review): confirm whether reproducing the reported numbers requires a
  # fixed seed or averaging over several runs.
  temperature: 0.7
  max_tokens: 256
  # NOTE(review): Mixtral-8x7B has roughly 47B parameters, so unquantized
  # 16-bit weights are on the order of 90 GB. A value of 1 will likely run out
  # of memory on a single 80 GB (or smaller) GPU — confirm the target hardware
  # or raise this value.
  tensor_parallel_size: 1         # increase for multi-GPU
  # NOTE(review): in vLLM this is the fraction of each GPU's memory the engine
  # may use — confirm it is passed through unchanged.
  gpu_memory_utilization: 0.90

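# ── Alternatively, point at a running vLLM server ──────────────────────────────
# NOTE: use this block INSTEAD of the `backend` block above, not in addition to
# it. Duplicate top-level keys are invalid YAML, and most parsers silently keep
# only the last one.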
# backend:
#   backend_type: vllm
#   mode: server
#   base_url: http://localhost:8000/v1
#   model: mistralai/Mixtral-8x7B-Instruct-v0.1
#   api_key: EMPTY
