# SmolLM2 (or any GGUF model) via llama-cpp-python — CPU-friendly
# Requires: pip install llama-cpp-python
# Download a GGUF from HuggingFace, e.g.:
#   huggingface-cli download HuggingFaceTB/SmolLM2-1.7B-Instruct-GGUF \
#       smollm2-1.7b-instruct-q4_k_m.gguf --local-dir models/
# Label for this configuration. NOTE(review): presumably used to tag
# runs/outputs by the consuming code — confirm against the loader.
name: SmolLM2-1.7B-llamacpp

# Task parameters. Their exact semantics are defined by the consuming code,
# which is not visible in this file; notes marked "presumably" are inferred
# from the key names only and should be confirmed.
task:
  nbr_latents: 3
  nbr_distractors: 0
  vocab_size: 6
  max_sentence_length: 3
  # NOTE(review): presumably a min/max pair bounding the number of values
  # each latent can take, so min must not exceed max — confirm.
  min_nbr_values_per_latent: 2
  max_nbr_values_per_latent: 5
  nbr_communication_rounds: 1
  descriptive: true
  provide_listener_feedback: true

# llama-cpp-python backend settings.
backend:
  backend_type: llamacpp
  # Same file name as in the download command in the header of this file.
  model_path: models/smollm2-1.7b-instruct-q4_k_m.gguf
  # Context window in tokens. SmolLM2-1.7B was trained with an 8192-token
  # context; llama.cpp allocates its KV cache for the full n_ctx up front, so
  # a larger value (previously 131072) costs tens of GiB of RAM on CPU and
  # runs the model outside its trained position range. Lower this further
  # (e.g. 2048) to save memory if prompts are short.
  n_ctx: 8192
  n_gpu_layers: 0    # set >0 to offload layers to GPU
  temperature: 0.7
  max_tokens: 256
  verbose: false
