"""Report how many model outputs begin with a ``<think>`` tag.

For each system-prompt setting in ``repos``, load the ``train`` split of the
associated evaluation dataset and print how many rows have a
``model_outputs`` value that starts with ``<think>``, next to the total row
count.
"""

from datasets import load_dataset

# Alternate set of evaluation runs (Llama-3.1-Nemotron-Nano-8B-v1); swap it in
# for the mapping below to report on those instead.
# repos = {
#     "detailed thinking on": "/Llama-3.1-Nemotron-Nano-8B-v1_1743011149_eval_0981",
#     "detailed thinking off": "/Llama-3.1-Nemotron-Nano-8B-v1_1743011943_eval_0981",
#     "NONE": "/Llama-3.1-Nemotron-Nano-8B-v1_1743012005_eval_0981"
# }

# Maps a system-prompt label to the dataset repository holding that run.
# NOTE(review): every repo id starts with "/", which looks like a stripped
# namespace/user prefix -- confirm the full ids before running.
repos = {
    "detailed thinking on": "/qwen2-5_nemotron-sft_100000_1743011928_eval_0981",
    "detailed thinking off": "/qwen2-5_nemotron-sft_100000_1743018696_eval_0981",
    "NONE": "/qwen2-5_nemotron-sft_100000_1743001432_eval_0981",
}

for system, repo in repos.items():
    # `split="train"` makes load_dataset return a single Dataset, so len()
    # below counts rows (the keyword was previously misspelled as `spt`).
    ds = load_dataset(repo, split="train")
    total = len(ds)

    # Keep only the rows whose output opens with the thinking tag.
    ds = ds.filter(lambda x: x["model_outputs"].startswith("<think>"))
    thinking = len(ds)

    print(f"{system}: {thinking} / {total} starts with <think>")