# Flat mapping of numeric settings.
# NOTE(review): the key names suggest reinforcement-learning training
# hyperparameters (possibly Soft Actor-Critic). Every meaning given below is
# inferred from the key name only -- confirm against the code that loads this
# file before relying on it.

# Presumably the number of samples drawn per training batch.
batch_size: 256
# Presumably the reward discount factor.
gamma: 0.99
# Presumably the optimizer learning rate. Keep the plain decimal spelling:
# some YAML 1.1 loaders (e.g. PyYAML) read exponent forms without a decimal
# point, such as 3e-4, as strings rather than floats.
lr: 0.0003
# Alternative start_steps setting, currently disabled:
# start_steps: 10000
# Active start_steps value. Presumably a count of initial environment steps
# taken before some training phase begins -- TODO confirm what it gates.
start_steps: 1000
# Presumably the width (unit count) of the network's hidden layers.
hidden_size: 256
# Presumably the soft (Polyak) target-update coefficient.
tau: 0.005
# Presumably the entropy temperature, if the consumer is SAC -- TODO confirm.
alpha: 0.2
# Presumably a multiplier applied to rewards.
reward_scale: 5


