# Run-size settings.
# NOTE(review): presumably the epoch count and the number of GPUs to use; the
# commands that consume these values are outside this chunk - confirm.
EPOCH="3"
NUM_GPUS="8"

# Model and dataset identifiers. MODEL_ORG and BASE_MODEL are later joined as
# "<org>/<model>" to build INFERENCE_MODEL_PATH.
BASE_MODEL="Qwen3-8B"
MODEL_ORG=Qwen
TRAIN_DATASET="qwen3-8B-vanilla-codegen"

# Root directories; the /path/to/home prefix is a placeholder to be replaced.
# NOTE(review): presumably one holds raw checkpoints and the other converted
# ones; neither is referenced in the visible part of this script - confirm.
CHECK_POINT_ROOT_PATH='/path/to/home/checkpoints'
CONVERTED_CHECK_POINT_ROOT_PATH='/path/to/home/converted_checkpoint'

# System prompt text: tells the model to generate Python code from a
# <problem>/<input> pair, predict the execution result, and wrap code,
# reasoning, and output in <code>, <think>, and <answer> tags.
# Single-quoted so the shell stores the text verbatim (no expansion).
SYSTEM_PROMPT='You are a highly capable assistant. You will receive a problem statement enclosed in <problem></problem> tags and an input enclosed in <input></input> tags. Your task is to generate Python code from this information and predict the result produced when the code is executed with the given input. Wrap the generated code, your reasoning process, and the output in <code></code>, <think></think>, and <answer></answer> tags, respectively; i.e., <code> python code here </code> <think> reasoning process here </think><answer> output here </answer>.'

# Choose the checkpoint iteration: use the contents of the file named by
# LATEST_ITERATION_FILE when that file exists and yields a value; otherwise
# fall back to 7500.
# NOTE(review): LATEST_ITERATION_FILE is not assigned in the visible part of
# this script; unless the environment or another part of the file sets it,
# the fallback is always taken - confirm this is intended.
# "${VAR:-}" keeps the existence test from aborting under `set -u` when the
# variable is unset.
if [ -f "${LATEST_ITERATION_FILE:-}" ]; then
  # A failed read is treated the same as an empty file.
  ITERATION=$(cat "$LATEST_ITERATION_FILE") || ITERATION=""
  if [ -z "$ITERATION" ]; then
    # Do not let an empty value propagate silently into later commands.
    printf 'warning: %s is empty or unreadable; using default iteration 7500\n' \
      "$LATEST_ITERATION_FILE" >&2
    ITERATION=7500
  fi
else
  ITERATION=7500
fi

# Model identifier used for inference, built as "<MODEL_ORG>/<BASE_MODEL>"
# from the variables assigned earlier in this script.
INFERENCE_MODEL_PATH="$MODEL_ORG/$BASE_MODEL"

# Guided-decoding switch, stored as the literal string "false".
# NOTE(review): how this flag is consumed is outside this chunk.
USE_GUIDED_DECODING="false"
