<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>Counterfactual Prompt Controls</title>
<style>
  html, body { margin: 0; padding: 0; overflow: hidden; width: 100%; height: 100%; font-family: 'Georgia', serif; background: #fafafa; }
  svg { display: block; width: 100%; height: 100%; }
  .tooltip { position: absolute; background: rgba(255,255,255,0.96); border: 1px solid #ccc; border-radius: 6px; padding: 10px 14px; font-size: 13px; line-height: 1.5; pointer-events: none; box-shadow: 0 2px 8px rgba(0,0,0,0.12); max-width: 280px; }
  .controls { position: absolute; top: 12px; left: 50%; transform: translateX(-50%); display: flex; gap: 8px; z-index: 10; }
  .btn { padding: 5px 12px; border: 2px solid #ddd; border-radius: 16px; background: #fff; font-size: 11px; font-weight: 600; cursor: pointer; transition: all 0.2s; font-family: 'Georgia', serif; }
  .btn.active { border-color: #333; background: #333; color: #fff; }
  .btn:hover { border-color: #666; }
</style>
</head>
<body>
<div class="controls">
  <button class="btn active" data-view="accuracy">Accuracy</button>
  <button class="btn" data-view="flips">C→I Flips</button>
</div>
<div class="tooltip" id="tip" style="display:none;"></div>
<svg id="chart"></svg>
<script src="https://d3js.org/d3.v7.min.js"></script>
<script>
const models = [
  { name: "Qwen2.5-7B", zs: 18.3, cot: 75.4, brief: 71.4, verify: 67.0, cotFlips: 39, briefFlips: 35, verifyFlips: 35, verifySaves: 28 },
  { name: "Llama-3.1-8B", zs: 14.6, cot: 23.4, brief: 29.5, verify: 13.9, cotFlips: 131, briefFlips: 106, verifyFlips: 122, verifySaves: 48 },
  { name: "Llama-2-7B", zs: 4.2, cot: 15.5, brief: 19.3, verify: 9.9, cotFlips: 46, briefFlips: 38, verifyFlips: 42, verifySaves: 11 },
  { name: "Mistral-7B", zs: 4.5, cot: 7.2, brief: 13.4, verify: 0.9, cotFlips: 52, briefFlips: 33, verifyFlips: 56, verifySaves: 1 }
];

const conditions = [
  { key: "zs", label: "Zero-Shot", color: "#999", desc: "Direct answer, no reasoning" },
  { key: "cot", label: "CoT", color: "#4e79a7", desc: "Full step-by-step with #### format" },
  { key: "brief", label: "Brief", color: "#e15759", desc: '"Think briefly, then answer"' },
  { key: "verify", label: "Verify", color: "#f28e2b", desc: '"The answer might be X. Verify step by step."' }
];

const svg = d3.select("#chart");
const tip = d3.select("#tip");
let viewMode = "accuracy";

document.querySelectorAll(".btn").forEach(btn => {
  btn.addEventListener("click", () => {
    document.querySelectorAll(".btn").forEach(b => b.classList.remove("active"));
    btn.classList.add("active");
    viewMode = btn.dataset.view;
    draw();
  });
});

function draw() {
  const W = window.innerWidth, H = window.innerHeight;
  const m = { top: 50, right: 20, bottom: 70, left: 55 };
  const w = W - m.left - m.right, h = H - m.top - m.bottom;
  svg.selectAll("*").remove();
  const g = svg.append("g").attr("transform", `translate(${m.left},${m.top})`);

  const x0 = d3.scaleBand().domain(models.map(d=>d.name)).range([0, w]).padding(0.2);
  const x1 = d3.scaleBand().domain(conditions.map(c=>c.key)).range([0, x0.bandwidth()]).padding(0.08);

  if (viewMode === "accuracy") {
    const y = d3.scaleLinear().domain([0, 82]).range([h, 0]);
    g.append("g").attr("transform",`translate(0,${h})`).call(d3.axisBottom(x0)).selectAll("text").attr("font-size","11px");
    g.append("g").call(d3.axisLeft(y).ticks(6).tickFormat(d=>d+"%"));
    g.append("text").attr("transform","rotate(-90)").attr("x",-h/2).attr("y",-40).attr("text-anchor","middle").attr("font-size","13px").attr("fill","#333").attr("font-weight",600).text("Accuracy (%)");

    models.forEach(mod => {
      conditions.forEach(cond => {
        const val = mod[cond.key];
        g.append("rect")
          .attr("x", x0(mod.name) + x1(cond.key))
          .attr("y", y(val)).attr("width", x1.bandwidth()).attr("height", y(0)-y(val))
          .attr("fill", cond.color).attr("rx", 2)
          .style("cursor","pointer")
          .on("mouseover", e => {
            tip.style("display","block").html(
              `<b>${mod.name}</b><br>
               <b style="color:${cond.color}">● ${cond.label}</b>: ${val.toFixed(1)}%<br>
               <i>${cond.desc}</i>`
            );
          })
          .on("mousemove", e => { tip.style("left",(e.pageX+12)+"px").style("top",(e.pageY-10)+"px"); })
          .on("mouseout", () => tip.style("display","none"));

        if (val > 3) {
          g.append("text")
            .attr("x", x0(mod.name) + x1(cond.key) + x1.bandwidth()/2)
            .attr("y", y(val) - 4)
            .attr("text-anchor","middle").attr("font-size","10px").attr("fill","#333").attr("font-weight",600)
            .attr("pointer-events","none")
            .text(val.toFixed(1));
        }
      });
    });
  } else {
    // Flips view
    const flipConds = [
      { key: "cotFlips", label: "CoT Flips", color: "#4e79a7" },
      { key: "briefFlips", label: "Brief Flips", color: "#e15759" },
      { key: "verifySaves", label: "Verify Saves", color: "#59a14f" }
    ];
    const maxFlip = d3.max(models, d => Math.max(d.cotFlips, d.briefFlips));
    const y = d3.scaleLinear().domain([0, maxFlip * 1.1]).range([h, 0]);
    const x1f = d3.scaleBand().domain(flipConds.map(c=>c.key)).range([0, x0.bandwidth()]).padding(0.08);

    g.append("g").attr("transform",`translate(0,${h})`).call(d3.axisBottom(x0)).selectAll("text").attr("font-size","11px");
    g.append("g").call(d3.axisLeft(y).ticks(6));
    g.append("text").attr("transform","rotate(-90)").attr("x",-h/2).attr("y",-40).attr("text-anchor","middle").attr("font-size","13px").attr("fill","#333").attr("font-weight",600).text("Count");

    models.forEach(mod => {
      flipConds.forEach(cond => {
        const val = mod[cond.key];
        g.append("rect")
          .attr("x", x0(mod.name) + x1f(cond.key))
          .attr("y", y(val)).attr("width", x1f.bandwidth()).attr("height", y(0)-y(val))
          .attr("fill", cond.color).attr("rx", 2)
          .style("cursor","pointer")
          .on("mouseover", e => {
            const extra = cond.key === "verifySaves" ? `<br>Save rate: ${mod.cotFlips>0?(val/mod.cotFlips*100).toFixed(0):'0'}%` : '';
            tip.style("display","block").html(`<b>${mod.name}</b><br><b style="color:${cond.color}">● ${cond.label}</b>: ${val}${extra}`);
          })
          .on("mousemove", e => { tip.style("left",(e.pageX+12)+"px").style("top",(e.pageY-10)+"px"); })
          .on("mouseout", () => tip.style("display","none"));

        g.append("text")
          .attr("x", x0(mod.name) + x1f(cond.key) + x1f.bandwidth()/2)
          .attr("y", y(val) - 4)
          .attr("text-anchor","middle").attr("font-size","10px").attr("fill","#333").attr("font-weight",600)
          .attr("pointer-events","none").text(val);
      });
    });
  }

  // Legend
  const legendData = viewMode === "accuracy" ? conditions :
    [{ key:"cotFlips", label:"CoT C→I Flips", color:"#4e79a7" }, { key:"briefFlips", label:"Brief C→I Flips", color:"#e15759" }, { key:"verifySaves", label:"Verify Saves", color:"#59a14f" }];
  const legendY = h + 35;
  const spacing = w / legendData.length;
  legendData.forEach((c, i) => {
    g.append("rect").attr("x", i*spacing+5).attr("y", legendY).attr("width",12).attr("height",12).attr("fill",c.color).attr("rx",2);
    g.append("text").attr("x", i*spacing+20).attr("y", legendY+10).attr("font-size","11px").attr("fill","#555").text(c.label);
  });
}

draw();
window.addEventListener("resize", draw);
</script>
</body>
</html>
