# Generation settings for llmplus.GenerationConfig.
# NOTE(review): `_target_` looks like a Hydra-style instantiate target --
# confirm against whatever loads this file.
_target_: llmplus.GenerationConfig
n: 1
# Previously 0.3. Apparently temperature can only be 1 when thinking is
# enabled, so it is set to 1.0 here.
temperature: 1.0
# max_tokens must be > thinking budget_tokens (16000 below).
max_tokens: 32000
top_p: 1
batch_size: 8
seed: 88
ignore_cache: false
extra_kwargs:
  extra_body:
    thinking:
      type: enabled
      budget_tokens: 16000

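# Example of building a thinking-enabled config directly in Python, kept
# for reference (values differ from the YAML above):
# gen_cfg = GenerationConfig(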
#     n=2,
#     temperature=1.0,
#     # max_tokens must be > thinking budget_tokens
#     max_tokens=1124,
#     extra_kwargs={
#         "extra_body": {
#             "thinking": {
#                 "type": "enabled",
#                 # apparently the min value for this is 1024
#                 "budget_tokens": 1024,
#             }
#         }
#     },
# )

