{
  "file": "...",
  "per_item": [
    {
      "id": "76",
      "accuracy_string": 0,
      "accuracy_symbolic": 0,
      "f1_exact": {
        "precision": 0.0,
        "recall": 0.0,
        "f1": 0.0
      },
      "f1_semantic": {
        "precision": 0.3333333333333333,
        "recall": 0.6666666666666666,
        "f1": 0.4444444444444444,
        "sim_threshold": 0.7
      },
      "srs_components": {
        "faithfulness": 0.7152597109476725,
        "info_step": 0.6948292951868928,
        "info_chain": 0.9128024578094482,
        "repetition_step": 0.06451988220214844,
        "discourse": 0.6224352419376373,
        "coherence": 0.04519200325012207
      },
      "srs": 0.5091730985556536,
      "vr_score": 0.26389482617378235,
      "pred_answer": "0",
      "ref_answer_expr_used": "log((pi + 3*sqrt3)/(pi - 3*sqrt3))",
      "ref_steps_count": 3,
      "hyp_steps_count": 6
    },
    {
      "id": "239",
      "accuracy_string": 0,
      "accuracy_symbolic": 1,
      "f1_exact": {
        "precision": 0.0,
        "recall": 0.0,
        "f1": 0.0
      },
      "f1_semantic": {
        "precision": 0.6666666666666666,
        "recall": 1.0,
        "f1": 0.8,
        "sim_threshold": 0.7
      },
      "srs_components": {
        "faithfulness": 0.7426896095275879,
        "info_step": 0.6982916663400829,
        "info_chain": 0.9395443201065063,
        "repetition_step": 0.09631824493408203,
        "discourse": 0.726351410150528,
        "coherence": 0.762936145067215
      },
      "srs": 0.6610218993543336,
      "vr_score": 0.39624062180519104,
      "pred_answer": "\\ln |x + \\cos x| + C",
      "ref_answer_expr_used": "log(Abs(x+\\cos x))",
      "ref_steps_count": 2,
      "hyp_steps_count": 3
    }
  ],
  "aggregates": {
    "count": 2,
    "accuracy_string": 0.0,
    "accuracy_symbolic": 0.5,
    "f1_exact_precision": 0.0,
    "f1_exact_recall": 0.0,
    "f1_exact_f1": 0.0,
    "f1_semantic_precision": 0.5,
    "f1_semantic_recall": 0.8333333333333333,
    "f1_semantic_f1": 0.6222222222222222,
    "srs": 0.5850974989549936,
    "vr_score": 0.3300677239894867,
    "srs_faithfulness": 0.7289746602376301,
    "srs_info_step": 0.6965604807634879,
    "srs_info_chain": 0.9261733889579773,
    "srs_repetition_step": 0.08041906356811523,
    "srs_discourse": 0.6743933260440826,
    "srs_coherence": 0.4040640741586685
  }
}