[
  {
    "label": "itrainingrecipeofscreasoner"
  },
  {
    "label": "a"
  },
  {
    "label": "annotate"
  },
  {
    "label": "iterativereasoningrationales"
  },
  {
    "label": "iterativereasoner"
  },
  {
    "label": "sft"
  },
  {
    "label": "subquesplanningdecomposition"
  },
  {
    "label": "iterativereasoning"
  },
  {
    "label": "activateretrieval"
  },
  {
    "label": "reasonermodules"
  },
  {
    "label": "finetune"
  },
  {
    "label": "inference"
  },
  {
    "label": "syntheticrationales"
  },
  {
    "label": "criticdata"
  },
  {
    "label": "sft"
  },
  {
    "label": "feedback"
  },
  {
    "label": "insightloop"
  },
  {
    "label": "retrievalquality"
  },
  {
    "label": "qwherewasthefilmthefamilystoneset"
  },
  {
    "label": "dthefamilystonethestonefamilyisa"
  },
  {
    "label": "relevant"
  },
  {
    "label": "partial"
  },
  {
    "label": "irrelevant"
  },
  {
    "label": "reasoningquality"
  },
  {
    "label": "qwherewasthefilmthefamilystoneset"
  },
  {
    "label": "dthefamilystonethestonefamilyisa"
  },
  {
    "label": "useful"
  },
  {
    "label": "partial"
  },
  {
    "label": "useless"
  },
  {
    "label": "overallquality"
  },
  {
    "label": "evaluatethewholereasoningtrajectory"
  },
  {
    "label": "1"
  },
  {
    "label": "2"
  },
  {
    "label": "3"
  },
  {
    "label": "4"
  },
  {
    "label": "5"
  },
  {
    "label": "6"
  },
  {
    "label": "7"
  },
  {
    "label": "criticmodel"
  }
]