# Configuration for the GuoxinChen/ReForm-32B model.

# Model identifier and API selection.
model: GuoxinChen/ReForm-32B
api: vllm
base_output_template: qwen
# NOTE(review): presumably expressed in billions, matching the "32B" in the
# model name — confirm against the consumer of this field.
effective_parameters: 32

# Sampling settings.
temperature: 1.0
top_p: 0.95

# Length limits.
# NOTE(review): max_tokens is set equal to max_model_len. If max_model_len is
# the total context window (prompt plus completion), this leaves no headroom
# for the prompt — confirm how the consumer handles that case.
max_tokens: 32768
max_model_len: 32768

# Compute resources.
n_gpus: 4
node: 1

# Cost fields; both are zero for this model.
read_cost: 0
write_cost: 0
