{"batch_size": 2048, "ds_path": "./datasets_v2/llama3_instruct-RTP_split-B11-block", "factor": 6, "k": 2048, "lr": 1e-05, "max_epochs": 100, "n_inputs": 4096, "activation": "topk-sigmoid"}