"""Build a combined ShareGPT-style dataset and push it to the Hugging Face Hub.

The script loads the "metadata" config of Open-Thoughts-114k, converts each
row into a two-turn ``conversations`` list, appends a second dataset as-is,
concatenates both and uploads the result.
"""

import os

OPEN_THOUGHTS_REPO = "open-thoughts/Open-Thoughts-114k"
# NOTE(review): the two ids below start with "-dev/", which looks like a
# namespace that lost its leading part -- confirm the intended owner before
# running, since the Hub is unlikely to accept these ids as written.
OPENR1_SHAREGPT_REPO = "-dev/OpenR1-Math-Raw-all-correct-sharegpt"
OUTPUT_REPO = "-dev/ot-114k_Math-Raw-all-correct"


def map_to_sharegpt(x):
    """Attach a ShareGPT-style ``conversations`` list to one example.

    Args:
        x: Mapping with the keys ``"problem"``, ``"deepseek_reasoning"`` and
            ``"deepseek_solution"``.

    Returns:
        The same object ``x`` (mutated in place) with a new ``"conversations"``
        key holding a user turn (the problem) and an assistant turn (the
        reasoning wrapped in ``<think>`` tags, followed by the solution).

    Raises:
        KeyError: If any of the three required keys is missing.
    """
    x["conversations"] = [
        {"from": "user", "value": x["problem"]},
        {
            "from": "assistant",
            "value": f"<think>\n\n{x['deepseek_reasoning']}\n\n</think>\n\n{x['deepseek_solution']}",
        },
    ]
    return x


def main():
    """Load both source datasets, merge them and push the mix to the Hub."""
    # Imported here rather than at module level so that `map_to_sharegpt`
    # stays importable (and testable) without the `datasets` package.
    from datasets import concatenate_datasets, load_dataset

    parts = []

    # `split="train"` makes `load_dataset` return a single `Dataset`, which is
    # what `concatenate_datasets` expects. (The keyword was previously
    # misspelled as `spt`.)
    open_thoughts = load_dataset(OPEN_THOUGHTS_REPO, "metadata", split="train")
    open_thoughts = open_thoughts.map(map_to_sharegpt, num_proc=os.cpu_count())
    # Keep only the generated column so both parts share the same schema.
    open_thoughts = open_thoughts.select_columns(["conversations"])
    parts.append(open_thoughts)

    # Appended without conversion -- presumably this dataset already exposes
    # only a compatible `conversations` column; verify before relying on it.
    openr1 = load_dataset(OPENR1_SHAREGPT_REPO, split="train")
    parts.append(openr1)

    # Combine into final mix
    combined = concatenate_datasets(parts)
    combined.push_to_hub(OUTPUT_REPO)


# The guard keeps worker processes started by `map(num_proc=...)` from
# re-running the whole pipeline when they re-import this module.
if __name__ == "__main__":
    main()