---
# Run configuration: device selection, logging, schedule length,
# optimizer settings and checkpointing.
# NOTE(review): the code that consumes these keys is not visible from this
# file, so the per-key notes below are assumptions to confirm, not guarantees.

# Device string passed to the consumer (presumably a torch-style device
# name -- confirm). Kept quoted so it is always read as a string.
device: 'cuda'

# Boolean flags use canonical lowercase true/false so every YAML loader
# and linter agrees on their type.
log_to_tensorboard: true
save_model: true

# Schedule. Presumably the run performs num_steps_per_iter * max_iters
# (10000 * 10 = 100000) steps in total and evaluates with
# num_eval_episodes episodes -- TODO confirm against the training loop.
num_steps_per_iter: 10000
max_iters: 10
num_eval_episodes: 32

# Optimizer settings. warmup_steps is presumably a learning-rate warmup
# length; at 10000 it equals one full num_steps_per_iter -- confirm intended.
# The floats stay in plain decimal form: exponent notation such as 1e-4 is
# not read as a float by every YAML parser.
warmup_steps: 10000
weight_decay: 0.0001
learning_rate: 0.0001



