---
# Hyperparameter configuration.
# NOTE(review): the per-key descriptions below are inferred from the key
# names alone; confirm each against the code that loads this file.

# List of three integer sizes (200 each) -- presumably the hidden-layer
# widths of the representation network.
repre_layer_sizes: [200, 200, 200]

# Boolean switch -- presumably enables batch normalization.
bn: true

# Optimizer selected by name, with its step size.
optimizer: adam
learning_rate: 0.001

# Fractional value (0.8) -- presumably the share of data or training
# budget used for pretraining; TODO confirm.
pretrain_ratio: 0.8

# Integer "K" applied during training -- its exact meaning is not evident
# from this file; TODO confirm with the consumer.
policy_K_for_train: 2