Expert(Sto) Return Avg: 5282.87, std: 61.55
array([5261.126, 5220.272, 5369.898, 5265.225, 5345.264, 5299.185,
       5263.83 , 5282.481, 5339.214, 5229.632, 5254.6  , 5268.923,
       5260.497, 5412.119, 5141.294, 5326.029, 5149.482, 5345.089,
       5377.8  , 5283.117, 5282.514, 5300.918, 5329.301, 5330.37 ,
       5306.1  , 5208.902, 5265.598, 5364.134, 5244.984, 5260.738,
       5263.193, 5235.041, 5346.142, 5313.363, 5274.433, 5208.766,
       5196.669, 5187.763, 5299.936, 5367.852, 5332.699, 5287.605,
       5265.647, 5325.082, 5373.766, 5324.203, 5351.685, 5282.84 ,
       5378.598, 5323.029, 5190.351, 5297.805, 5283.88 , 5352.085,
       5143.822, 5287.518, 5215.844, 5174.678, 5228.075, 5327.414,
       5284.936, 5284.466, 5197.341, 5308.467])
Expert(Det) Return Avg: 5363.57, std: 20.40
array([5340.267, 5387.999, 5358.028, 5391.539, 5348.315, 5363.486,
       5404.907, 5370.395, 5361.01 , 5367.414, 5421.749, 5383.293,
       5387.888, 5381.33 , 5355.675, 5369.748, 5325.229, 5380.246,
       5345.327, 5359.53 , 5339.488, 5372.874, 5364.594, 5355.034,
       5389.343, 5381.065, 5381.276, 5384.112, 5364.693, 5309.454,
       5389.588, 5340.07 , 5383.136, 5356.044, 5371.805, 5350.596,
       5365.128, 5358.02 , 5384.953, 5374.71 , 5355.334, 5346.256,
       5361.66 , 5374.906, 5355.252, 5360.674, 5349.86 , 5356.463,
       5380.413, 5374.634, 5354.81 , 5343.651, 5355.194, 5357.311,
       5355.223, 5325.203, 5371.777, 5359.081, 5347.788, 5363.838,
       5325.75 , 5325.392, 5351.245, 5397.708])
ordereddict([('seed', 666), ('cuda', -1), ('env', ordereddict([('env_name', 'Walker2dFH-v0'), ('T', 1000)])), ('sac', ordereddict([('epochs', 3000), ('log_step_interval', 5000), ('update_every', 50), ('update_num', 1), ('random_explore_episodes', 10), ('batch_size', 100), ('lr', 0.001), ('alpha', 0.2), ('automatic_alpha_tuning', False), ('buffer_size', 1000000), ('num_test_episodes', 10)])), ('expert', ordereddict([('samples_episode', 64)])), ('launching_env', 'walker2d'), ('_hidden_keys', []), ('exp_cnt', 1), ('exp_name', '7-16-sac-samples_2020_07_16_20_24_30_0002')])