---
# Settings for one dataset run over the LaMini instruction data.
# NOTE(review): the script that consumes this file is not visible from here;
# the per-key notes below are inferred from key names only — confirm them
# against the consumer before relying on them.

# Source data. The value has the "namespace/name" form of a Hugging Face Hub
# dataset id — presumably passed to a dataset loader; TODO confirm.
dataset: 'MBZUAI/LaMini-instruction'
split: 'train'

# Column names looked up in each record. Presumably `condition_column` is the
# input text and `target_column` is the expected output — verify in the caller.
condition_column: 'instruction'
target_column: 'response'

# Size limits. Units are not stated in this file; `max_length` is presumably a
# per-example length cap in tokens, and the meaning of `num_tokens` cannot be
# determined from here — TODO confirm both.
max_length: 512
num_tokens: 10

# Output. `save_path` is a relative name (no directory component);
# `shard_size` is presumably the per-shard capacity, unit unknown — TODO confirm.
save_path: 'lamini_instruction'
shard_size: 100000000