"""Merge two Hugging Face SFT datasets, shuffle them, and publish the result.

The script loads the ``train`` split of two Hub datasets, concatenates them
into a single dataset, shuffles the rows with a fixed seed, and pushes the
combined dataset to the Hub under a new repository id.
"""

from datasets import load_dataset, concatenate_datasets

# Only the "train" split of each source dataset is used.
dataset1 = load_dataset("qihoo360/ght-R1-SFTData")["train"]
# NOTE(review): this repo id starts with "-" (empty-looking namespace prefix);
# it looks truncated or redacted -- confirm the intended organisation name.
dataset2 = load_dataset("-dev/openthoughts_114k_thinkprompt")["train"]

# Stack the rows of both datasets into one.
# NOTE(review): presumably both datasets share the same column schema;
# verify before running, since nothing here aligns or casts the columns.
combined = concatenate_datasets([dataset1, dataset2])

# Fixed seed so the shuffled order is repeatable across runs.
combined = combined.shuffle(seed=42)

# Publish the merged dataset to the Hub.
# NOTE(review): same leading "-" in the target repo id -- confirm.
combined.push_to_hub("-dev/openthoughts_plus_ght-R1-SFTData")