# Run-level settings: which backend, device and checkpoint to load.
# NOTE(review): the code that consumes this file is not visible from here, so
# the per-key notes below are assumptions to confirm against the loader.
framework: "huggingface"


# Target device string; presumably passed to the model/tensors as-is.
device: "cuda"
# Matches the name of the Transformers auto class for causal language models;
# presumably used to pick the class that loads the checkpoint.
mode: "AutoModelForCausalLM"
model:
  # Looks like a Hugging Face Hub repository id ("<owner>/<model>").
  name: "replit/replit-code-v1-3b"
  # NOTE(review): in Transformers, trust_remote_code=True allows Python code
  # shipped in the model repository to run locally. Confirm the repository is
  # trusted, and consider pinning a revision where the loader supports it.
  trust_remote_code: true
tokenizer:
  # Same flag for the tokenizer; the same review note applies.
  trust_remote_code: true

# Presumably the number of prompts processed per generation call - confirm.
batch_size: 20
# Presumably forwarded to the tokenizer's decode step so special tokens are
# removed from the decoded text - confirm.
skip_special_tokens: true

# Parameters for GenerationConfig.
# See the documentation: https://huggingface.co/docs/transformers/main/en/main_classes/text_generation#transformers.GenerationConfig
# Generation settings. The key names match fields of the Transformers
# GenerationConfig; descriptions below follow that documentation.
params:
  # Maximum number of tokens to generate, not counting the prompt tokens.
  max_new_tokens: 128
  # Stopping condition for beam-based methods; relevant since num_beams > 1.
  early_stopping: true
  # Number of beams for beam search (1 would mean no beam search).
  num_beams: 3
  # NOTE(review): do_sample is not set in this block. Per the GenerationConfig
  # documentation, temperature / top_p / top_k only take effect when sampling
  # is enabled, so these three are presumably inert here - confirm whether
  # plain beam search is intended or do_sample is supplied elsewhere.
  temperature: 1.0
  top_p: 1.0
  top_k: 50
  # Number of independently returned sequences per input.
  num_return_sequences: 1
