"""Filter a Hub dataset down to its "code" rows and push the result to the Hub.

Loads the ``train`` split of the source dataset, keeps only the rows whose
``_domain`` column equals ``"code"``, and uploads the filtered rows as the
``train`` split of the target repository.
"""

from datasets import load_dataset

# NOTE(review): both repo ids start with "-dev/", which looks like a truncated
# namespace (organisation/user prefix missing) — confirm the intended ids.
ds = load_dataset("-dev/openthoughts3_100k", split="train")

# Keep only the rows tagged as code.
# NOTE(review): assumes the dataset has a "_domain" column — verify the name.
code_ds = ds.filter(lambda x: x["_domain"] == "code")

# NOTE(review): the target name mentions "20k", but no row-count limit is
# applied here; every row that passes the filter is uploaded — confirm intent.
# The return value of push_to_hub is intentionally not bound to ``code_ds`` so
# that the name keeps referring to the filtered dataset.
code_ds.push_to_hub("-dev/openthoughts3_100k_code_only_20k", split="train")