0	Namespace(device='0', env='BO', training_episode=1001, T=100, domain_size=1000, f_num=2, hidden_size=128, lr=1e-05, new_lr=-1, n_batch=1, weight_decay=1e-05, update_freq=1, target_update_freq=5, batch_size=8, n_layer=4, n_head=4, n_positions=31, warmup_steps=1, gamma=0.95, seed=1, function_type='train', model_episode=0, optimizer='adam', dropout=0.1, epsilon=0.1, sample_rate=0.005, demo_rate=0.01, buffer_size=64, new_reward=1)
1	Namespace(device='0', env='BO', training_episode=1001, T=100, domain_size=1000, f_num=3, hidden_size=128, lr=1e-05, new_lr=-1, n_batch=1, weight_decay=1e-05, update_freq=1, target_update_freq=5, batch_size=8, n_layer=4, n_head=4, n_positions=31, warmup_steps=1, gamma=0.95, seed=1, function_type='train', model_episode=0, optimizer='adam', dropout=0.1, epsilon=0.1, sample_rate=0.005, demo_rate=0.01, buffer_size=64, new_reward=1)
2	Namespace(device='3', env='BO', training_episode=2001, T=100, domain_size=1000, f_num=2, hidden_size=128, lr=1e-05, n_batch=1, weight_decay=1e-05, update_freq=1, target_update_freq=5, batch_size=8, n_layer=4, n_head=4, n_positions=301, warmup_steps=1, gamma=0.95, seed=1, function_type='train', model_episode=0, optimizer='adam', dropout=0.1, epsilon=0.1, sample_rate=0.005, demo_rate=0.01, buffer_size=64, new_reward=1, noise_level=0.1, update_step=10, initial_sample=1)
3	Namespace(device='0', env='BO', training_episode=2001, T=100, domain_size=1000, f_num=3, hidden_size=128, lr=1e-05, n_batch=1, weight_decay=1e-05, update_freq=1, target_update_freq=5, batch_size=8, n_layer=4, n_head=4, n_positions=91, warmup_steps=1, gamma=0.95, seed=1, function_type='train', model_episode=0, optimizer='adam', dropout=0.1, epsilon=0.1, sample_rate=0.005, demo_rate=0.01, buffer_size=64, new_reward=1, noise_level=0.1, update_step=10, initial_sample=1)
