{
  "timestamp": "2025-09-14T21:53:11.673490",
  "benchmark_size": 10,
  "prompt_type": "direct_answer",
  "models_evaluated": [
    "huggingface/Qwen/Qwen3-0.6B"
  ],
  "results_summary": {
    "huggingface/Qwen/Qwen3-0.6B": {
      "accuracy": 0.0,
      "avg_response_time": 0.4475364923477173,
      "results_by_operation": {
        "addition": {
          "total": 3,
          "correct": 0,
          "accuracy": 0.0,
          "avg_response_time": 0.2432378133138021
        },
        "subtraction": {
          "total": 4,
          "correct": 0,
          "accuracy": 0.0,
          "avg_response_time": 0.6541732549667358
        },
        "exponentiation": {
          "total": 1,
          "correct": 0,
          "accuracy": 0.0,
          "avg_response_time": 0.7674651145935059
        },
        "logarithm": {
          "total": 2,
          "correct": 0,
          "accuracy": 0.0,
          "avg_response_time": 0.1807466745376587
        }
      },
      "results_by_difficulty": {
        "easy": {
          "total": 1,
          "correct": 0,
          "accuracy": 0.0,
          "avg_response_time": 0.20609593391418457
        },
        "medium": {
          "total": 3,
          "correct": 0,
          "accuracy": 0.0,
          "avg_response_time": 0.25335693359375
        },
        "hard": {
          "total": 6,
          "correct": 0,
          "accuracy": 0.0,
          "avg_response_time": 0.5848663647969564
        }
      },
      "metadata": {
        "prompt_type": "direct_answer",
        "prompt_description": "Direct numerical answer only"
      }
    }
  }
}