# Input data.
# smiles_file: SMILES strings encoded in byte-string form,
# e.g. np.array([b'CCO', b'CCN', ...]).
# NOTE(review): this input was originally described as an npy file, yet the
# path below ends in .h5 -- confirm which on-disk format is expected.
smiles_file: './clean_smiles.h5'
# target_file: an h5 file with a key 'targets' that contains a numpy array of
# shape (n,) for n scalar targets.
target_file: './clean_targets.h5'

# Input/target generators, selected by name, each with a mapping of
# additional arguments (empty here).
input_generator: 'SMILESInputBasic'
input_generator_addn_args: {}
target_generator: 'ScalarTarget'
target_generator_addn_args: {}

# Output location and remaining settings.
output_file: './toxicity_dset.h5'
alphabet: null
num_processes: 16
