# Data pruning: on/off switch plus the ratio value that accompanies it.
# NOTE(review): presumably the ratio is the fraction of the data kept when
# pruning is enabled (0.2 = 20%) — confirm against the consuming code.
data_pruning: true
data_preserved_ratio: 0.2

# Training loop sizing.
n_epochs: 200
batch_size: 128

# Learning rate and decay factor for the "forward" component.
# NOTE(review): whether decay is applied per epoch or per step is not
# visible in this file — confirm against the consuming code.
forward_lr: 0.001
forward_lr_decay: 0.98

# Learning rate and decay factor for the "weight" component.
weight_lr: 0.0005
weight_lr_decay: 0.99
# NOTE(review): the meaning of gradient_alpha is defined by the consumer;
# it is grouped with the weight_* keys here only because the original file
# places it in the same stanza — confirm.
gradient_alpha: 0.12