2023-07-07 00:04:44,500 -        meta learning: [    INFO] - [INFO] checkpoint saved to: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 00:04:44,500 -        meta learning: [    INFO] - [INFO] tensorboard dir set to: ./runs/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 00:04:44,500 -        meta learning: [    INFO] - [ARGS]: Namespace(policy='BatchedGruMetaStdpMLPPolicy', algo='PGPE', task='SeqTask', seq_length=20, latency=24, num_cls=5, feature_dims=14, sigma=0.1, batch_size=512, hidden_dims=[128], pop_size=256, center_lr=0.01, init_std=0.04, decay_std=0.999, limit_std=0.001, std_lr=0.07, terminate_when_unhealthy=False, max_iters=12000, num_tasks=1, seed=42, num_tests=128, eval_epoch=100, eval=False, eval_with_injury=False, resume='', save=False, repeat=20, root_dir='/data/anonymous/meta', tensorboard_dir='./runs', suffix='', output_dir='/data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444', summary_writer=<torch.utils.tensorboard.writer.SummaryWriter object at 0x7fbbe02e6d00>, tb_prefix='PGPE/SeqTask/BatchedGruMetaStdpMLPPolicy')
2023-07-07 00:04:47,772 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 00:04:47,835 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 00:04:55,556 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 100, best=0.73, avg=0.71, std=0.01, steps=4.137e+05
2023-07-07 00:04:59,529 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 200, best=0.79, avg=0.78, std=0.01, steps=8.233e+05
2023-07-07 00:05:03,447 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 300, best=0.88, avg=0.86, std=0.01, steps=1.233e+06
2023-07-07 00:05:07,369 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 400, best=0.92, avg=0.90, std=0.01, steps=1.642e+06
2023-07-07 00:05:11,315 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 500, best=0.96, avg=0.95, std=0.00, steps=2.052e+06
2023-07-07 00:05:15,262 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 600, best=0.98, avg=0.97, std=0.00, steps=2.462e+06
2023-07-07 00:05:19,216 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 700, best=1.00, avg=0.99, std=0.00, steps=2.871e+06
2023-07-07 00:05:23,180 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 800, best=1.00, avg=1.00, std=0.00, steps=3.281e+06
2023-07-07 00:05:27,170 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 900, best=1.00, avg=1.00, std=0.00, steps=3.690e+06
2023-07-07 00:05:31,132 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 1000, best=1.00, avg=1.00, std=0.00, steps=4.100e+06
2023-07-07 00:05:35,067 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 1100, best=1.00, avg=1.00, std=0.00, steps=4.510e+06
2023-07-07 00:05:38,999 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 1200, best=1.00, avg=1.00, std=0.00, steps=4.919e+06
2023-07-07 00:05:42,941 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 1300, best=1.00, avg=1.00, std=0.00, steps=5.329e+06
2023-07-07 00:05:46,888 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 1400, best=1.00, avg=1.00, std=0.00, steps=5.738e+06
2023-07-07 00:05:50,842 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 1500, best=1.00, avg=1.00, std=0.00, steps=6.148e+06
2023-07-07 00:05:54,767 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 1600, best=1.00, avg=1.00, std=0.00, steps=6.558e+06
2023-07-07 00:05:58,694 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 1700, best=1.00, avg=1.00, std=0.00, steps=6.967e+06
2023-07-07 00:06:02,616 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 1800, best=1.00, avg=1.00, std=0.00, steps=7.377e+06
2023-07-07 00:06:06,560 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 1900, best=1.00, avg=1.00, std=0.00, steps=7.786e+06
2023-07-07 00:06:10,516 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 2000, best=1.00, avg=1.00, std=0.00, steps=8.196e+06
2023-07-07 00:06:14,467 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 2100, best=1.00, avg=1.00, std=0.00, steps=8.606e+06
2023-07-07 00:06:18,427 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 2200, best=1.00, avg=1.00, std=0.00, steps=9.015e+06
2023-07-07 00:06:22,399 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 2300, best=1.00, avg=1.00, std=0.00, steps=9.425e+06
2023-07-07 00:06:26,361 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 2400, best=1.00, avg=1.00, std=0.00, steps=9.834e+06
2023-07-07 00:06:30,319 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 2500, best=1.00, avg=1.00, std=0.00, steps=1.024e+07
2023-07-07 00:06:34,268 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 2600, best=1.00, avg=1.00, std=0.00, steps=1.065e+07
2023-07-07 00:06:38,218 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 2700, best=1.00, avg=1.00, std=0.00, steps=1.106e+07
2023-07-07 00:06:42,182 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 2800, best=1.00, avg=1.00, std=0.00, steps=1.147e+07
2023-07-07 00:06:46,149 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 2900, best=1.00, avg=1.00, std=0.00, steps=1.188e+07
2023-07-07 00:06:50,111 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 3000, best=1.00, avg=1.00, std=0.00, steps=1.229e+07
2023-07-07 00:06:54,049 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 3100, best=1.00, avg=1.00, std=0.00, steps=1.270e+07
2023-07-07 00:06:57,986 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 3200, best=1.00, avg=1.00, std=0.00, steps=1.311e+07
2023-07-07 00:07:01,918 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 3300, best=1.00, avg=1.00, std=0.00, steps=1.352e+07
2023-07-07 00:07:05,846 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 3400, best=1.00, avg=1.00, std=0.00, steps=1.393e+07
2023-07-07 00:07:09,797 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 3500, best=1.00, avg=1.00, std=0.00, steps=1.434e+07
2023-07-07 00:07:13,748 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 3600, best=1.00, avg=1.00, std=0.00, steps=1.475e+07
2023-07-07 00:07:17,688 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 3700, best=1.00, avg=1.00, std=0.00, steps=1.516e+07
2023-07-07 00:07:21,616 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 3800, best=1.00, avg=1.00, std=0.00, steps=1.557e+07
2023-07-07 00:07:25,567 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 3900, best=1.00, avg=1.00, std=0.00, steps=1.598e+07
2023-07-07 00:07:29,519 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 4000, best=1.00, avg=1.00, std=0.00, steps=1.639e+07
2023-07-07 00:07:33,472 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 4100, best=1.00, avg=1.00, std=0.00, steps=1.680e+07
2023-07-07 00:07:37,428 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 4200, best=1.00, avg=1.00, std=0.00, steps=1.721e+07
2023-07-07 00:07:41,376 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 4300, best=1.00, avg=1.00, std=0.00, steps=1.762e+07
2023-07-07 00:07:45,325 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 4400, best=1.00, avg=1.00, std=0.00, steps=1.803e+07
2023-07-07 00:07:49,273 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 4500, best=1.00, avg=1.00, std=0.00, steps=1.844e+07
2023-07-07 00:07:53,209 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 4600, best=1.00, avg=1.00, std=0.00, steps=1.885e+07
2023-07-07 00:07:57,140 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 4700, best=1.00, avg=1.00, std=0.00, steps=1.926e+07
2023-07-07 00:08:01,082 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 4800, best=1.00, avg=1.00, std=0.00, steps=1.966e+07
2023-07-07 00:08:05,023 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 4900, best=1.00, avg=1.00, std=0.00, steps=2.007e+07
2023-07-07 00:08:08,966 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 5000, best=1.00, avg=1.00, std=0.00, steps=2.048e+07
2023-07-07 00:08:12,907 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 5100, best=1.00, avg=1.00, std=0.00, steps=2.089e+07
2023-07-07 00:08:16,853 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 5200, best=1.00, avg=1.00, std=0.00, steps=2.130e+07
2023-07-07 00:08:20,782 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 5300, best=1.00, avg=1.00, std=0.00, steps=2.171e+07
2023-07-07 00:08:24,734 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 5400, best=1.00, avg=1.00, std=0.00, steps=2.212e+07
2023-07-07 00:08:28,696 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 5500, best=1.00, avg=1.00, std=0.00, steps=2.253e+07
2023-07-07 00:08:32,672 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 5600, best=1.00, avg=1.00, std=0.00, steps=2.294e+07
2023-07-07 00:08:36,631 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 5700, best=1.00, avg=1.00, std=0.00, steps=2.335e+07
2023-07-07 00:08:40,588 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 5800, best=1.00, avg=1.00, std=0.00, steps=2.376e+07
2023-07-07 00:08:44,523 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 5900, best=1.00, avg=1.00, std=0.00, steps=2.417e+07
2023-07-07 00:08:48,456 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 6000, best=1.00, avg=1.00, std=0.00, steps=2.458e+07
2023-07-07 00:08:52,399 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 6100, best=1.00, avg=1.00, std=0.00, steps=2.499e+07
2023-07-07 00:08:56,330 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 6200, best=1.00, avg=1.00, std=0.00, steps=2.540e+07
2023-07-07 00:09:00,275 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 6300, best=1.00, avg=1.00, std=0.00, steps=2.581e+07
2023-07-07 00:09:04,257 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 6400, best=1.00, avg=1.00, std=0.00, steps=2.622e+07
2023-07-07 00:09:08,231 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 6500, best=1.00, avg=1.00, std=0.00, steps=2.663e+07
2023-07-07 00:09:12,211 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 6600, best=1.00, avg=1.00, std=0.00, steps=2.704e+07
2023-07-07 00:09:16,186 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 6700, best=1.00, avg=1.00, std=0.00, steps=2.745e+07
2023-07-07 00:09:20,146 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 6800, best=1.00, avg=1.00, std=0.00, steps=2.786e+07
2023-07-07 00:09:24,112 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 6900, best=1.00, avg=1.00, std=0.00, steps=2.827e+07
2023-07-07 00:09:28,066 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 7000, best=1.00, avg=1.00, std=0.00, steps=2.868e+07
2023-07-07 00:09:32,028 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 7100, best=1.00, avg=1.00, std=0.00, steps=2.909e+07
2023-07-07 00:09:35,995 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 7200, best=1.00, avg=1.00, std=0.00, steps=2.950e+07
2023-07-07 00:09:39,955 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 7300, best=1.00, avg=1.00, std=0.00, steps=2.990e+07
2023-07-07 00:09:43,899 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 7400, best=1.00, avg=1.00, std=0.00, steps=3.031e+07
2023-07-07 00:09:47,842 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 7500, best=1.00, avg=1.00, std=0.00, steps=3.072e+07
2023-07-07 00:09:51,783 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 7600, best=1.00, avg=1.00, std=0.00, steps=3.113e+07
2023-07-07 00:09:55,738 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 7700, best=1.00, avg=1.00, std=0.00, steps=3.154e+07
2023-07-07 00:09:59,693 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 7800, best=1.00, avg=1.00, std=0.00, steps=3.195e+07
2023-07-07 00:10:03,662 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 7900, best=1.00, avg=1.00, std=0.00, steps=3.236e+07
2023-07-07 00:10:07,589 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 8000, best=1.00, avg=1.00, std=0.00, steps=3.277e+07
2023-07-07 00:10:11,531 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 8100, best=1.00, avg=1.00, std=0.00, steps=3.318e+07
2023-07-07 00:10:15,479 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 8200, best=1.00, avg=1.00, std=0.00, steps=3.359e+07
2023-07-07 00:10:19,418 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 8300, best=1.00, avg=1.00, std=0.00, steps=3.400e+07
2023-07-07 00:10:23,347 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 8400, best=1.00, avg=1.00, std=0.00, steps=3.441e+07
2023-07-07 00:10:27,280 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 8500, best=1.00, avg=1.00, std=0.00, steps=3.482e+07
2023-07-07 00:10:31,203 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 8600, best=1.00, avg=1.00, std=0.00, steps=3.523e+07
2023-07-07 00:10:35,127 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 8700, best=1.00, avg=1.00, std=0.00, steps=3.564e+07
2023-07-07 00:10:39,051 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 8800, best=1.00, avg=1.00, std=0.00, steps=3.605e+07
2023-07-07 00:10:42,975 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 8900, best=1.00, avg=1.00, std=0.00, steps=3.646e+07
2023-07-07 00:10:46,908 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 9000, best=1.00, avg=1.00, std=0.00, steps=3.687e+07
2023-07-07 00:10:50,813 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 9100, best=1.00, avg=1.00, std=0.00, steps=3.728e+07
2023-07-07 00:10:54,729 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 9200, best=1.00, avg=1.00, std=0.00, steps=3.769e+07
2023-07-07 00:10:58,642 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 9300, best=1.00, avg=1.00, std=0.00, steps=3.810e+07
2023-07-07 00:11:02,577 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 9400, best=1.00, avg=1.00, std=0.00, steps=3.851e+07
2023-07-07 00:11:06,506 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 9500, best=1.00, avg=1.00, std=0.00, steps=3.892e+07
2023-07-07 00:11:10,449 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 9600, best=1.00, avg=1.00, std=0.00, steps=3.933e+07
2023-07-07 00:11:14,391 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 9700, best=1.00, avg=1.00, std=0.00, steps=3.974e+07
2023-07-07 00:11:18,329 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 9800, best=1.00, avg=1.00, std=0.00, steps=4.014e+07
2023-07-07 00:11:22,301 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 9900, best=1.00, avg=1.00, std=0.00, steps=4.055e+07
2023-07-07 00:11:26,256 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 10000, best=1.00, avg=1.00, std=0.00, steps=4.096e+07
2023-07-07 00:11:30,215 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 10100, best=1.00, avg=1.00, std=0.00, steps=4.137e+07
2023-07-07 00:11:34,173 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 10200, best=1.00, avg=1.00, std=0.00, steps=4.178e+07
2023-07-07 00:11:38,102 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 10300, best=1.00, avg=1.00, std=0.00, steps=4.219e+07
2023-07-07 00:11:42,036 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 10400, best=1.00, avg=1.00, std=0.00, steps=4.260e+07
2023-07-07 00:11:45,966 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 10500, best=1.00, avg=1.00, std=0.00, steps=4.301e+07
2023-07-07 00:11:49,894 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 10600, best=1.00, avg=1.00, std=0.00, steps=4.342e+07
2023-07-07 00:11:53,830 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 10700, best=1.00, avg=1.00, std=0.00, steps=4.383e+07
2023-07-07 00:11:57,756 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 10800, best=1.00, avg=1.00, std=0.00, steps=4.424e+07
2023-07-07 00:12:01,684 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 10900, best=1.00, avg=1.00, std=0.00, steps=4.465e+07
2023-07-07 00:12:05,633 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 11000, best=1.00, avg=1.00, std=0.00, steps=4.506e+07
2023-07-07 00:12:09,584 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 11100, best=1.00, avg=1.00, std=0.00, steps=4.547e+07
2023-07-07 00:12:13,539 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 11200, best=1.00, avg=1.00, std=0.00, steps=4.588e+07
2023-07-07 00:12:17,506 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 11300, best=1.00, avg=1.00, std=0.00, steps=4.629e+07
2023-07-07 00:12:21,446 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 11400, best=1.00, avg=1.00, std=0.00, steps=4.670e+07
2023-07-07 00:12:25,391 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 11500, best=1.00, avg=1.00, std=0.00, steps=4.711e+07
2023-07-07 00:12:29,329 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 11600, best=1.00, avg=1.00, std=0.00, steps=4.752e+07
2023-07-07 00:12:33,275 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 11700, best=1.00, avg=1.00, std=0.00, steps=4.793e+07
2023-07-07 00:12:37,216 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 11800, best=1.00, avg=1.00, std=0.00, steps=4.834e+07
2023-07-07 00:12:41,129 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 11900, best=1.00, avg=1.00, std=0.00, steps=4.875e+07
2023-07-07 00:12:45,011 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 0, [Train]: 11999, best=1.00, avg=1.00, std=0.00, steps=4.915e+07
2023-07-07 00:12:45,011 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 00:12:45,036 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 00:12:45,067 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 00:12:52,793 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 100, best=0.52, avg=0.50, std=0.01, steps=6.205e+05
2023-07-07 00:12:58,530 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 200, best=0.70, avg=0.69, std=0.01, steps=1.235e+06
2023-07-07 00:13:04,280 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 300, best=0.74, avg=0.72, std=0.01, steps=1.849e+06
2023-07-07 00:13:10,018 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 400, best=0.76, avg=0.75, std=0.01, steps=2.464e+06
2023-07-07 00:13:15,773 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 500, best=0.78, avg=0.77, std=0.01, steps=3.078e+06
2023-07-07 00:13:21,524 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 600, best=0.80, avg=0.79, std=0.01, steps=3.693e+06
2023-07-07 00:13:27,265 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 700, best=0.82, avg=0.81, std=0.01, steps=4.307e+06
2023-07-07 00:13:33,024 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 800, best=0.84, avg=0.82, std=0.01, steps=4.921e+06
2023-07-07 00:13:38,792 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 900, best=0.84, avg=0.83, std=0.01, steps=5.536e+06
2023-07-07 00:13:44,527 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 1000, best=0.85, avg=0.84, std=0.01, steps=6.150e+06
2023-07-07 00:13:50,261 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 1100, best=0.86, avg=0.85, std=0.01, steps=6.765e+06
2023-07-07 00:13:55,990 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 1200, best=0.87, avg=0.86, std=0.00, steps=7.379e+06
2023-07-07 00:14:01,761 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 1300, best=0.88, avg=0.87, std=0.00, steps=7.993e+06
2023-07-07 00:14:07,532 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 1400, best=0.89, avg=0.87, std=0.00, steps=8.608e+06
2023-07-07 00:14:13,270 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 1500, best=0.89, avg=0.88, std=0.00, steps=9.222e+06
2023-07-07 00:14:19,000 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 1600, best=0.89, avg=0.88, std=0.00, steps=9.837e+06
2023-07-07 00:14:24,719 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 1700, best=0.89, avg=0.88, std=0.00, steps=1.045e+07
2023-07-07 00:14:30,449 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 1800, best=0.89, avg=0.88, std=0.00, steps=1.107e+07
2023-07-07 00:14:36,201 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 1900, best=0.90, avg=0.89, std=0.00, steps=1.168e+07
2023-07-07 00:14:41,953 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 2000, best=0.90, avg=0.89, std=0.00, steps=1.229e+07
2023-07-07 00:14:47,710 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 2100, best=0.90, avg=0.89, std=0.00, steps=1.291e+07
2023-07-07 00:14:53,459 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 2200, best=0.90, avg=0.89, std=0.00, steps=1.352e+07
2023-07-07 00:14:59,228 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 2300, best=0.90, avg=0.89, std=0.00, steps=1.414e+07
2023-07-07 00:15:04,994 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 2400, best=0.90, avg=0.89, std=0.00, steps=1.475e+07
2023-07-07 00:15:10,756 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 2500, best=0.90, avg=0.89, std=0.00, steps=1.537e+07
2023-07-07 00:15:16,543 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 2600, best=0.90, avg=0.90, std=0.00, steps=1.598e+07
2023-07-07 00:15:22,323 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 2700, best=0.90, avg=0.90, std=0.00, steps=1.659e+07
2023-07-07 00:15:28,050 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 2800, best=0.90, avg=0.90, std=0.00, steps=1.721e+07
2023-07-07 00:15:33,815 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 2900, best=0.91, avg=0.90, std=0.00, steps=1.782e+07
2023-07-07 00:15:39,582 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 3000, best=0.91, avg=0.90, std=0.00, steps=1.844e+07
2023-07-07 00:15:45,311 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 3100, best=0.91, avg=0.90, std=0.00, steps=1.905e+07
2023-07-07 00:15:51,043 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 3200, best=0.91, avg=0.90, std=0.00, steps=1.967e+07
2023-07-07 00:15:56,768 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 3300, best=0.91, avg=0.90, std=0.00, steps=2.028e+07
2023-07-07 00:16:02,520 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 3400, best=0.91, avg=0.90, std=0.00, steps=2.090e+07
2023-07-07 00:16:08,297 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 3500, best=0.91, avg=0.90, std=0.00, steps=2.151e+07
2023-07-07 00:16:14,059 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 3600, best=0.91, avg=0.90, std=0.00, steps=2.212e+07
2023-07-07 00:16:19,821 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 3700, best=0.91, avg=0.90, std=0.00, steps=2.274e+07
2023-07-07 00:16:25,576 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 3800, best=0.91, avg=0.90, std=0.00, steps=2.335e+07
2023-07-07 00:16:31,353 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 3900, best=0.91, avg=0.90, std=0.00, steps=2.397e+07
2023-07-07 00:16:37,115 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 4000, best=0.91, avg=0.90, std=0.00, steps=2.458e+07
2023-07-07 00:16:42,890 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 4100, best=0.91, avg=0.90, std=0.00, steps=2.520e+07
2023-07-07 00:16:48,686 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 4200, best=0.91, avg=0.90, std=0.00, steps=2.581e+07
2023-07-07 00:16:54,460 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 4300, best=0.91, avg=0.90, std=0.00, steps=2.643e+07
2023-07-07 00:17:00,216 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 4400, best=0.91, avg=0.90, std=0.00, steps=2.704e+07
2023-07-07 00:17:05,999 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 4500, best=0.91, avg=0.90, std=0.00, steps=2.765e+07
2023-07-07 00:17:11,759 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 4600, best=0.91, avg=0.90, std=0.00, steps=2.827e+07
2023-07-07 00:17:17,523 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 4700, best=0.91, avg=0.90, std=0.00, steps=2.888e+07
2023-07-07 00:17:23,309 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 4800, best=0.91, avg=0.90, std=0.00, steps=2.950e+07
2023-07-07 00:17:29,045 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 4900, best=0.91, avg=0.90, std=0.00, steps=3.011e+07
2023-07-07 00:17:34,779 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 5000, best=0.91, avg=0.90, std=0.00, steps=3.073e+07
2023-07-07 00:17:40,519 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 5100, best=0.91, avg=0.90, std=0.00, steps=3.134e+07
2023-07-07 00:17:46,256 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 5200, best=0.91, avg=0.90, std=0.00, steps=3.195e+07
2023-07-07 00:17:52,015 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 5300, best=0.91, avg=0.90, std=0.00, steps=3.257e+07
2023-07-07 00:17:57,791 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 5400, best=0.92, avg=0.91, std=0.00, steps=3.318e+07
2023-07-07 00:18:03,541 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 5500, best=0.91, avg=0.91, std=0.00, steps=3.380e+07
2023-07-07 00:18:09,318 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 5600, best=0.91, avg=0.90, std=0.00, steps=3.441e+07
2023-07-07 00:18:15,105 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 5700, best=0.92, avg=0.90, std=0.00, steps=3.503e+07
2023-07-07 00:18:20,860 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 5800, best=0.91, avg=0.90, std=0.00, steps=3.564e+07
2023-07-07 00:18:26,600 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 5900, best=0.92, avg=0.90, std=0.00, steps=3.626e+07
2023-07-07 00:18:32,329 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 6000, best=0.91, avg=0.91, std=0.00, steps=3.687e+07
2023-07-07 00:18:38,055 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 6100, best=0.91, avg=0.91, std=0.00, steps=3.748e+07
2023-07-07 00:18:43,810 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 6200, best=0.91, avg=0.90, std=0.00, steps=3.810e+07
2023-07-07 00:18:49,537 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 6300, best=0.92, avg=0.91, std=0.00, steps=3.871e+07
2023-07-07 00:18:55,270 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 6400, best=0.92, avg=0.91, std=0.00, steps=3.933e+07
2023-07-07 00:19:01,007 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 6500, best=0.92, avg=0.91, std=0.00, steps=3.994e+07
2023-07-07 00:19:06,752 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 6600, best=0.92, avg=0.91, std=0.00, steps=4.056e+07
2023-07-07 00:19:12,491 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 6700, best=0.92, avg=0.91, std=0.00, steps=4.117e+07
2023-07-07 00:19:18,241 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 6800, best=0.92, avg=0.91, std=0.00, steps=4.179e+07
2023-07-07 00:19:23,986 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 6900, best=0.92, avg=0.91, std=0.00, steps=4.240e+07
2023-07-07 00:19:29,717 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 7000, best=0.93, avg=0.91, std=0.00, steps=4.301e+07
2023-07-07 00:19:35,461 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 7100, best=0.92, avg=0.92, std=0.00, steps=4.363e+07
2023-07-07 00:19:41,204 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 7200, best=0.93, avg=0.92, std=0.00, steps=4.424e+07
2023-07-07 00:19:46,964 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 7300, best=0.92, avg=0.92, std=0.00, steps=4.486e+07
2023-07-07 00:19:52,755 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 7400, best=0.93, avg=0.92, std=0.00, steps=4.547e+07
2023-07-07 00:19:58,503 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 7500, best=0.93, avg=0.92, std=0.00, steps=4.609e+07
2023-07-07 00:20:04,277 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 7600, best=0.93, avg=0.92, std=0.00, steps=4.670e+07
2023-07-07 00:20:10,055 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 7700, best=0.93, avg=0.92, std=0.00, steps=4.731e+07
2023-07-07 00:20:15,797 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 7800, best=0.93, avg=0.92, std=0.00, steps=4.793e+07
2023-07-07 00:20:21,558 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 7900, best=0.93, avg=0.92, std=0.00, steps=4.854e+07
2023-07-07 00:20:27,326 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 8000, best=0.93, avg=0.92, std=0.00, steps=4.916e+07
2023-07-07 00:20:33,085 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 8100, best=0.92, avg=0.92, std=0.00, steps=4.977e+07
2023-07-07 00:20:38,833 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 8200, best=0.92, avg=0.92, std=0.00, steps=5.039e+07
2023-07-07 00:20:44,621 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 8300, best=0.92, avg=0.92, std=0.00, steps=5.100e+07
2023-07-07 00:20:50,373 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 8400, best=0.92, avg=0.92, std=0.00, steps=5.162e+07
2023-07-07 00:20:56,110 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 8500, best=0.92, avg=0.92, std=0.00, steps=5.223e+07
2023-07-07 00:21:01,860 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 8600, best=0.93, avg=0.92, std=0.00, steps=5.284e+07
2023-07-07 00:21:07,606 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 8700, best=0.93, avg=0.92, std=0.00, steps=5.346e+07
2023-07-07 00:21:13,336 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 8800, best=0.92, avg=0.92, std=0.00, steps=5.407e+07
2023-07-07 00:21:19,095 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 8900, best=0.92, avg=0.91, std=0.00, steps=5.469e+07
2023-07-07 00:21:24,848 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 9000, best=0.93, avg=0.92, std=0.00, steps=5.530e+07
2023-07-07 00:21:30,595 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 9100, best=0.93, avg=0.92, std=0.00, steps=5.592e+07
2023-07-07 00:21:36,331 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 9200, best=0.92, avg=0.92, std=0.00, steps=5.653e+07
2023-07-07 00:21:42,069 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 9300, best=0.93, avg=0.92, std=0.00, steps=5.715e+07
2023-07-07 00:21:47,816 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 9400, best=0.93, avg=0.92, std=0.00, steps=5.776e+07
2023-07-07 00:21:53,566 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 9500, best=0.93, avg=0.92, std=0.00, steps=5.837e+07
2023-07-07 00:21:59,345 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 9600, best=0.93, avg=0.92, std=0.00, steps=5.899e+07
2023-07-07 00:22:05,101 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 9700, best=0.92, avg=0.92, std=0.00, steps=5.960e+07
2023-07-07 00:22:10,842 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 9800, best=0.93, avg=0.91, std=0.00, steps=6.022e+07
2023-07-07 00:22:16,611 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 9900, best=0.93, avg=0.92, std=0.00, steps=6.083e+07
2023-07-07 00:22:22,397 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 10000, best=0.93, avg=0.92, std=0.00, steps=6.145e+07
2023-07-07 00:22:28,200 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 10100, best=0.93, avg=0.92, std=0.00, steps=6.206e+07
2023-07-07 00:22:33,961 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 10200, best=0.93, avg=0.92, std=0.00, steps=6.267e+07
2023-07-07 00:22:39,699 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 10300, best=0.93, avg=0.92, std=0.00, steps=6.329e+07
2023-07-07 00:22:45,437 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 10400, best=0.93, avg=0.92, std=0.00, steps=6.390e+07
2023-07-07 00:22:51,181 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 10500, best=0.92, avg=0.92, std=0.00, steps=6.452e+07
2023-07-07 00:22:56,924 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 10600, best=0.93, avg=0.92, std=0.00, steps=6.513e+07
2023-07-07 00:23:02,672 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 10700, best=0.92, avg=0.92, std=0.00, steps=6.575e+07
2023-07-07 00:23:08,410 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 10800, best=0.93, avg=0.92, std=0.00, steps=6.636e+07
2023-07-07 00:23:14,139 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 10900, best=0.92, avg=0.92, std=0.00, steps=6.698e+07
2023-07-07 00:23:19,866 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 11000, best=0.92, avg=0.92, std=0.00, steps=6.759e+07
2023-07-07 00:23:25,612 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 11100, best=0.93, avg=0.92, std=0.00, steps=6.820e+07
2023-07-07 00:23:31,356 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 11200, best=0.93, avg=0.92, std=0.00, steps=6.882e+07
2023-07-07 00:23:37,111 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 11300, best=0.92, avg=0.92, std=0.00, steps=6.943e+07
2023-07-07 00:23:42,848 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 11400, best=0.93, avg=0.92, std=0.00, steps=7.005e+07
2023-07-07 00:23:48,579 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 11500, best=0.93, avg=0.92, std=0.00, steps=7.066e+07
2023-07-07 00:23:54,320 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 11600, best=0.93, avg=0.92, std=0.00, steps=7.128e+07
2023-07-07 00:24:00,049 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 11700, best=0.93, avg=0.92, std=0.00, steps=7.189e+07
2023-07-07 00:24:05,787 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 11800, best=0.93, avg=0.92, std=0.00, steps=7.251e+07
2023-07-07 00:24:11,508 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 11900, best=0.92, avg=0.92, std=0.00, steps=7.312e+07
2023-07-07 00:24:17,208 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 0, [Train]: 11999, best=0.92, avg=0.92, std=0.00, steps=7.373e+07
2023-07-07 00:24:17,209 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 00:24:17,232 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 00:24:17,262 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 00:24:26,885 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 100, best=0.52, avg=0.50, std=0.01, steps=8.274e+05
2023-07-07 00:24:34,495 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 200, best=0.68, avg=0.66, std=0.01, steps=1.647e+06
2023-07-07 00:24:42,084 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 300, best=0.72, avg=0.70, std=0.01, steps=2.466e+06
2023-07-07 00:24:49,656 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 400, best=0.73, avg=0.71, std=0.01, steps=3.285e+06
2023-07-07 00:24:57,204 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 500, best=0.74, avg=0.73, std=0.01, steps=4.104e+06
2023-07-07 00:25:04,749 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 600, best=0.76, avg=0.74, std=0.01, steps=4.923e+06
2023-07-07 00:25:12,324 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 700, best=0.77, avg=0.76, std=0.01, steps=5.743e+06
2023-07-07 00:25:19,887 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 800, best=0.79, avg=0.77, std=0.01, steps=6.562e+06
2023-07-07 00:25:27,472 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 900, best=0.79, avg=0.77, std=0.01, steps=7.381e+06
2023-07-07 00:25:35,045 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 1000, best=0.80, avg=0.78, std=0.01, steps=8.200e+06
2023-07-07 00:25:42,613 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 1100, best=0.80, avg=0.79, std=0.01, steps=9.019e+06
2023-07-07 00:25:50,185 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 1200, best=0.81, avg=0.80, std=0.01, steps=9.839e+06
2023-07-07 00:25:57,740 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 1300, best=0.82, avg=0.80, std=0.00, steps=1.066e+07
2023-07-07 00:26:05,326 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 1400, best=0.83, avg=0.81, std=0.01, steps=1.148e+07
2023-07-07 00:26:12,926 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 1500, best=0.84, avg=0.82, std=0.00, steps=1.230e+07
2023-07-07 00:26:20,528 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 1600, best=0.84, avg=0.83, std=0.00, steps=1.312e+07
2023-07-07 00:26:28,129 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 1700, best=0.85, avg=0.83, std=0.01, steps=1.393e+07
2023-07-07 00:26:35,733 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 1800, best=0.85, avg=0.83, std=0.01, steps=1.475e+07
2023-07-07 00:26:43,329 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 1900, best=0.85, avg=0.84, std=0.00, steps=1.557e+07
2023-07-07 00:26:50,881 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 2000, best=0.85, avg=0.84, std=0.00, steps=1.639e+07
2023-07-07 00:26:58,449 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 2100, best=0.85, avg=0.84, std=0.00, steps=1.721e+07
2023-07-07 00:27:06,020 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 2200, best=0.85, avg=0.84, std=0.00, steps=1.803e+07
2023-07-07 00:27:13,583 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 2300, best=0.85, avg=0.84, std=0.01, steps=1.885e+07
2023-07-07 00:27:21,184 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 2400, best=0.86, avg=0.84, std=0.01, steps=1.967e+07
2023-07-07 00:27:28,796 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 2500, best=0.85, avg=0.85, std=0.00, steps=2.049e+07
2023-07-07 00:27:36,382 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 2600, best=0.86, avg=0.85, std=0.00, steps=2.131e+07
2023-07-07 00:27:43,990 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 2700, best=0.86, avg=0.85, std=0.00, steps=2.213e+07
2023-07-07 00:27:51,587 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 2800, best=0.86, avg=0.85, std=0.00, steps=2.295e+07
2023-07-07 00:27:59,118 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 2900, best=0.86, avg=0.85, std=0.00, steps=2.376e+07
2023-07-07 00:28:06,664 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 3000, best=0.87, avg=0.85, std=0.00, steps=2.458e+07
2023-07-07 00:28:14,193 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 3100, best=0.86, avg=0.85, std=0.00, steps=2.540e+07
2023-07-07 00:28:21,765 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 3200, best=0.86, avg=0.85, std=0.00, steps=2.622e+07
2023-07-07 00:28:29,358 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 3300, best=0.87, avg=0.86, std=0.00, steps=2.704e+07
2023-07-07 00:28:36,970 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 3400, best=0.87, avg=0.86, std=0.00, steps=2.786e+07
2023-07-07 00:28:44,578 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 3500, best=0.87, avg=0.86, std=0.00, steps=2.868e+07
2023-07-07 00:28:52,187 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 3600, best=0.87, avg=0.86, std=0.00, steps=2.950e+07
2023-07-07 00:28:59,752 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 3700, best=0.87, avg=0.86, std=0.00, steps=3.032e+07
2023-07-07 00:29:07,314 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 3800, best=0.87, avg=0.86, std=0.00, steps=3.114e+07
2023-07-07 00:29:14,898 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 3900, best=0.87, avg=0.86, std=0.00, steps=3.196e+07
2023-07-07 00:29:22,487 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 4000, best=0.87, avg=0.86, std=0.00, steps=3.278e+07
2023-07-07 00:29:30,092 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 4100, best=0.88, avg=0.87, std=0.00, steps=3.360e+07
2023-07-07 00:29:37,705 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 4200, best=0.88, avg=0.87, std=0.00, steps=3.441e+07
2023-07-07 00:29:45,243 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 4300, best=0.88, avg=0.87, std=0.00, steps=3.523e+07
2023-07-07 00:29:52,787 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 4400, best=0.88, avg=0.87, std=0.00, steps=3.605e+07
2023-07-07 00:30:00,342 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 4500, best=0.89, avg=0.88, std=0.00, steps=3.687e+07
2023-07-07 00:30:07,901 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 4600, best=0.89, avg=0.88, std=0.00, steps=3.769e+07
2023-07-07 00:30:15,499 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 4700, best=0.89, avg=0.88, std=0.00, steps=3.851e+07
2023-07-07 00:30:23,120 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 4800, best=0.89, avg=0.88, std=0.00, steps=3.933e+07
2023-07-07 00:30:30,729 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 4900, best=0.89, avg=0.88, std=0.00, steps=4.015e+07
2023-07-07 00:30:38,338 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 5000, best=0.89, avg=0.88, std=0.00, steps=4.097e+07
2023-07-07 00:30:45,925 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 5100, best=0.89, avg=0.88, std=0.00, steps=4.179e+07
2023-07-07 00:30:53,484 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 5200, best=0.89, avg=0.88, std=0.00, steps=4.261e+07
2023-07-07 00:31:01,043 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 5300, best=0.89, avg=0.88, std=0.00, steps=4.343e+07
2023-07-07 00:31:08,609 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 5400, best=0.89, avg=0.88, std=0.00, steps=4.424e+07
2023-07-07 00:31:16,169 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 5500, best=0.89, avg=0.88, std=0.00, steps=4.506e+07
2023-07-07 00:31:23,741 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 5600, best=0.89, avg=0.88, std=0.00, steps=4.588e+07
2023-07-07 00:31:31,316 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 5700, best=0.89, avg=0.88, std=0.00, steps=4.670e+07
2023-07-07 00:31:38,893 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 5800, best=0.89, avg=0.88, std=0.00, steps=4.752e+07
2023-07-07 00:31:46,512 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 5900, best=0.89, avg=0.88, std=0.00, steps=4.834e+07
2023-07-07 00:31:54,096 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 6000, best=0.89, avg=0.88, std=0.00, steps=4.916e+07
2023-07-07 00:32:01,654 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 6100, best=0.89, avg=0.88, std=0.00, steps=4.998e+07
2023-07-07 00:32:09,196 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 6200, best=0.89, avg=0.88, std=0.00, steps=5.080e+07
2023-07-07 00:32:16,743 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 6300, best=0.89, avg=0.88, std=0.00, steps=5.162e+07
2023-07-07 00:32:24,305 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 6400, best=0.89, avg=0.88, std=0.00, steps=5.244e+07
2023-07-07 00:32:31,870 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 6500, best=0.89, avg=0.88, std=0.00, steps=5.326e+07
2023-07-07 00:32:39,410 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 6600, best=0.89, avg=0.88, std=0.00, steps=5.408e+07
2023-07-07 00:32:46,952 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 6700, best=0.89, avg=0.88, std=0.00, steps=5.489e+07
2023-07-07 00:32:54,496 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 6800, best=0.89, avg=0.88, std=0.00, steps=5.571e+07
2023-07-07 00:33:02,052 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 6900, best=0.89, avg=0.88, std=0.00, steps=5.653e+07
2023-07-07 00:33:09,597 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 7000, best=0.89, avg=0.88, std=0.00, steps=5.735e+07
2023-07-07 00:33:17,173 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 7100, best=0.89, avg=0.88, std=0.00, steps=5.817e+07
2023-07-07 00:33:24,793 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 7200, best=0.89, avg=0.88, std=0.00, steps=5.899e+07
2023-07-07 00:33:32,383 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 7300, best=0.89, avg=0.88, std=0.00, steps=5.981e+07
2023-07-07 00:33:39,946 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 7400, best=0.89, avg=0.88, std=0.00, steps=6.063e+07
2023-07-07 00:33:47,512 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 7500, best=0.89, avg=0.88, std=0.00, steps=6.145e+07
2023-07-07 00:33:55,069 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 7600, best=0.89, avg=0.88, std=0.00, steps=6.227e+07
2023-07-07 00:34:02,618 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 7700, best=0.89, avg=0.88, std=0.00, steps=6.309e+07
2023-07-07 00:34:10,173 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 7800, best=0.89, avg=0.88, std=0.00, steps=6.391e+07
2023-07-07 00:34:17,720 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 7900, best=0.89, avg=0.88, std=0.00, steps=6.472e+07
2023-07-07 00:34:25,268 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 8000, best=0.89, avg=0.88, std=0.00, steps=6.554e+07
2023-07-07 00:34:32,816 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 8100, best=0.89, avg=0.88, std=0.00, steps=6.636e+07
2023-07-07 00:34:40,367 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 8200, best=0.90, avg=0.88, std=0.00, steps=6.718e+07
2023-07-07 00:34:47,949 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 8300, best=0.90, avg=0.88, std=0.00, steps=6.800e+07
2023-07-07 00:34:55,547 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 8400, best=0.89, avg=0.88, std=0.00, steps=6.882e+07
2023-07-07 00:35:03,095 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 8500, best=0.89, avg=0.88, std=0.00, steps=6.964e+07
2023-07-07 00:35:10,667 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 8600, best=0.89, avg=0.88, std=0.00, steps=7.046e+07
2023-07-07 00:35:18,224 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 8700, best=0.89, avg=0.88, std=0.00, steps=7.128e+07
2023-07-07 00:35:25,816 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 8800, best=0.89, avg=0.88, std=0.00, steps=7.210e+07
2023-07-07 00:35:33,429 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 8900, best=0.89, avg=0.88, std=0.00, steps=7.292e+07
2023-07-07 00:35:41,045 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 9000, best=0.89, avg=0.88, std=0.00, steps=7.374e+07
2023-07-07 00:35:48,606 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 9100, best=0.89, avg=0.88, std=0.00, steps=7.456e+07
2023-07-07 00:35:56,160 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 9200, best=0.89, avg=0.88, std=0.00, steps=7.537e+07
2023-07-07 00:36:03,724 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 9300, best=0.89, avg=0.88, std=0.00, steps=7.619e+07
2023-07-07 00:36:11,286 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 9400, best=0.89, avg=0.88, std=0.00, steps=7.701e+07
2023-07-07 00:36:18,871 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 9500, best=0.89, avg=0.88, std=0.00, steps=7.783e+07
2023-07-07 00:36:26,471 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 9600, best=0.89, avg=0.88, std=0.00, steps=7.865e+07
2023-07-07 00:36:34,055 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 9700, best=0.89, avg=0.88, std=0.00, steps=7.947e+07
2023-07-07 00:36:41,654 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 9800, best=0.89, avg=0.88, std=0.00, steps=8.029e+07
2023-07-07 00:36:49,259 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 9900, best=0.90, avg=0.88, std=0.00, steps=8.111e+07
2023-07-07 00:36:56,846 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 10000, best=0.89, avg=0.88, std=0.00, steps=8.193e+07
2023-07-07 00:37:04,403 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 10100, best=0.89, avg=0.88, std=0.00, steps=8.275e+07
2023-07-07 00:37:11,972 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 10200, best=0.89, avg=0.88, std=0.00, steps=8.357e+07
2023-07-07 00:37:19,531 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 10300, best=0.89, avg=0.88, std=0.00, steps=8.439e+07
2023-07-07 00:37:27,089 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 10400, best=0.89, avg=0.88, std=0.00, steps=8.520e+07
2023-07-07 00:37:34,679 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 10500, best=0.89, avg=0.88, std=0.00, steps=8.602e+07
2023-07-07 00:37:42,271 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 10600, best=0.89, avg=0.88, std=0.00, steps=8.684e+07
2023-07-07 00:37:49,887 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 10700, best=0.89, avg=0.88, std=0.00, steps=8.766e+07
2023-07-07 00:37:57,513 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 10800, best=0.89, avg=0.88, std=0.00, steps=8.848e+07
2023-07-07 00:38:05,131 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 10900, best=0.89, avg=0.88, std=0.00, steps=8.930e+07
2023-07-07 00:38:12,728 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 11000, best=0.89, avg=0.88, std=0.00, steps=9.012e+07
2023-07-07 00:38:20,297 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 11100, best=0.89, avg=0.88, std=0.00, steps=9.094e+07
2023-07-07 00:38:27,883 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 11200, best=0.89, avg=0.88, std=0.00, steps=9.176e+07
2023-07-07 00:38:35,492 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 11300, best=0.89, avg=0.88, std=0.00, steps=9.258e+07
2023-07-07 00:38:43,127 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 11400, best=0.89, avg=0.88, std=0.00, steps=9.340e+07
2023-07-07 00:38:50,690 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 11500, best=0.89, avg=0.88, std=0.00, steps=9.422e+07
2023-07-07 00:38:58,248 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 11600, best=0.89, avg=0.88, std=0.00, steps=9.504e+07
2023-07-07 00:39:05,802 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 11700, best=0.89, avg=0.88, std=0.00, steps=9.585e+07
2023-07-07 00:39:13,357 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 11800, best=0.89, avg=0.88, std=0.00, steps=9.667e+07
2023-07-07 00:39:20,912 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 11900, best=0.89, avg=0.88, std=0.00, steps=9.749e+07
2023-07-07 00:39:28,384 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 0, [Train]: 11999, best=0.89, avg=0.88, std=0.00, steps=9.830e+07
2023-07-07 00:39:28,385 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 00:39:28,408 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 00:39:28,438 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 00:39:41,715 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 100, best=0.52, avg=0.50, std=0.01, steps=1.241e+06
2023-07-07 00:39:52,946 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 200, best=0.52, avg=0.50, std=0.01, steps=2.470e+06
2023-07-07 00:40:04,181 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 300, best=0.52, avg=0.50, std=0.01, steps=3.699e+06
2023-07-07 00:40:15,414 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 400, best=0.52, avg=0.50, std=0.01, steps=4.927e+06
2023-07-07 00:40:26,693 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 500, best=0.52, avg=0.50, std=0.01, steps=6.156e+06
2023-07-07 00:40:37,884 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 600, best=0.52, avg=0.50, std=0.01, steps=7.385e+06
2023-07-07 00:40:49,082 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 700, best=0.52, avg=0.50, std=0.01, steps=8.614e+06
2023-07-07 00:41:00,290 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 800, best=0.52, avg=0.50, std=0.01, steps=9.843e+06
2023-07-07 00:41:11,487 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 900, best=0.52, avg=0.50, std=0.01, steps=1.107e+07
2023-07-07 00:41:22,687 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 1000, best=0.52, avg=0.50, std=0.01, steps=1.230e+07
2023-07-07 00:41:33,919 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 1100, best=0.52, avg=0.50, std=0.01, steps=1.353e+07
2023-07-07 00:41:45,112 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 1200, best=0.52, avg=0.50, std=0.01, steps=1.476e+07
2023-07-07 00:41:56,303 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 1300, best=0.52, avg=0.50, std=0.01, steps=1.599e+07
2023-07-07 00:42:07,509 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 1400, best=0.51, avg=0.50, std=0.01, steps=1.722e+07
2023-07-07 00:42:18,707 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 1500, best=0.52, avg=0.50, std=0.01, steps=1.844e+07
2023-07-07 00:42:29,973 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 1600, best=0.52, avg=0.50, std=0.01, steps=1.967e+07
2023-07-07 00:42:41,237 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 1700, best=0.52, avg=0.50, std=0.01, steps=2.090e+07
2023-07-07 00:42:52,443 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 1800, best=0.52, avg=0.50, std=0.01, steps=2.213e+07
2023-07-07 00:43:03,656 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 1900, best=0.52, avg=0.50, std=0.01, steps=2.336e+07
2023-07-07 00:43:14,830 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 2000, best=0.52, avg=0.50, std=0.01, steps=2.459e+07
2023-07-07 00:43:26,000 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 2100, best=0.52, avg=0.50, std=0.01, steps=2.582e+07
2023-07-07 00:43:37,208 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 2200, best=0.53, avg=0.50, std=0.01, steps=2.705e+07
2023-07-07 00:43:48,393 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 2300, best=0.52, avg=0.50, std=0.01, steps=2.827e+07
2023-07-07 00:43:59,585 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 2400, best=0.52, avg=0.50, std=0.01, steps=2.950e+07
2023-07-07 00:44:10,775 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 2500, best=0.53, avg=0.50, std=0.01, steps=3.073e+07
2023-07-07 00:44:21,978 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 2600, best=0.52, avg=0.50, std=0.01, steps=3.196e+07
2023-07-07 00:44:33,175 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 2700, best=0.52, avg=0.50, std=0.01, steps=3.319e+07
2023-07-07 00:44:44,405 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 2800, best=0.52, avg=0.50, std=0.01, steps=3.442e+07
2023-07-07 00:44:55,693 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 2900, best=0.52, avg=0.50, std=0.01, steps=3.565e+07
2023-07-07 00:45:06,976 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 3000, best=0.52, avg=0.50, std=0.01, steps=3.688e+07
2023-07-07 00:45:18,255 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 3100, best=0.52, avg=0.50, std=0.01, steps=3.811e+07
2023-07-07 00:45:29,503 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 3200, best=0.52, avg=0.50, std=0.01, steps=3.933e+07
2023-07-07 00:45:40,739 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 3300, best=0.53, avg=0.50, std=0.01, steps=4.056e+07
2023-07-07 00:45:52,038 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 3400, best=0.52, avg=0.50, std=0.01, steps=4.179e+07
2023-07-07 00:46:03,324 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 3500, best=0.52, avg=0.50, std=0.01, steps=4.302e+07
2023-07-07 00:46:14,613 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 3600, best=0.52, avg=0.50, std=0.01, steps=4.425e+07
2023-07-07 00:46:25,897 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 3700, best=0.52, avg=0.50, std=0.01, steps=4.548e+07
2023-07-07 00:46:37,178 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 3800, best=0.52, avg=0.50, std=0.01, steps=4.671e+07
2023-07-07 00:46:48,402 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 3900, best=0.53, avg=0.50, std=0.01, steps=4.794e+07
2023-07-07 00:46:59,574 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 4000, best=0.52, avg=0.50, std=0.01, steps=4.916e+07
2023-07-07 00:47:10,825 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 4100, best=0.52, avg=0.50, std=0.01, steps=5.039e+07
2023-07-07 00:47:22,114 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 4200, best=0.52, avg=0.50, std=0.01, steps=5.162e+07
2023-07-07 00:47:33,396 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 4300, best=0.52, avg=0.50, std=0.01, steps=5.285e+07
2023-07-07 00:47:44,656 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 4400, best=0.52, avg=0.50, std=0.01, steps=5.408e+07
2023-07-07 00:47:55,856 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 4500, best=0.52, avg=0.50, std=0.01, steps=5.531e+07
2023-07-07 00:48:07,040 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 4600, best=0.52, avg=0.50, std=0.01, steps=5.654e+07
2023-07-07 00:48:18,221 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 4700, best=0.52, avg=0.50, std=0.01, steps=5.777e+07
2023-07-07 00:48:29,418 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 4800, best=0.52, avg=0.50, std=0.01, steps=5.899e+07
2023-07-07 00:48:40,657 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 4900, best=0.53, avg=0.50, std=0.01, steps=6.022e+07
2023-07-07 00:48:51,876 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 5000, best=0.52, avg=0.50, std=0.01, steps=6.145e+07
2023-07-07 00:49:03,078 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 5100, best=0.53, avg=0.50, std=0.01, steps=6.268e+07
2023-07-07 00:49:14,261 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 5200, best=0.51, avg=0.50, std=0.01, steps=6.391e+07
2023-07-07 00:49:25,476 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 5300, best=0.52, avg=0.50, std=0.01, steps=6.514e+07
2023-07-07 00:49:36,700 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 5400, best=0.52, avg=0.50, std=0.01, steps=6.637e+07
2023-07-07 00:49:47,957 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 5500, best=0.52, avg=0.50, std=0.01, steps=6.760e+07
2023-07-07 00:49:59,195 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 5600, best=0.52, avg=0.50, std=0.01, steps=6.883e+07
2023-07-07 00:50:10,403 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 5700, best=0.52, avg=0.50, std=0.01, steps=7.005e+07
2023-07-07 00:50:21,598 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 5800, best=0.52, avg=0.50, std=0.01, steps=7.128e+07
2023-07-07 00:50:32,860 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 5900, best=0.52, avg=0.50, std=0.01, steps=7.251e+07
2023-07-07 00:50:44,088 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 6000, best=0.52, avg=0.50, std=0.01, steps=7.374e+07
2023-07-07 00:50:55,246 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 6100, best=0.52, avg=0.50, std=0.01, steps=7.497e+07
2023-07-07 00:51:06,444 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 6200, best=0.52, avg=0.50, std=0.01, steps=7.620e+07
2023-07-07 00:51:17,661 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 6300, best=0.52, avg=0.50, std=0.01, steps=7.743e+07
2023-07-07 00:51:28,914 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 6400, best=0.52, avg=0.50, std=0.01, steps=7.866e+07
2023-07-07 00:51:40,126 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 6500, best=0.52, avg=0.50, std=0.01, steps=7.988e+07
2023-07-07 00:51:51,310 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 6600, best=0.52, avg=0.50, std=0.01, steps=8.111e+07
2023-07-07 00:52:02,486 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 6700, best=0.52, avg=0.50, std=0.01, steps=8.234e+07
2023-07-07 00:52:13,674 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 6800, best=0.52, avg=0.50, std=0.01, steps=8.357e+07
2023-07-07 00:52:24,880 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 6900, best=0.52, avg=0.50, std=0.01, steps=8.480e+07
2023-07-07 00:52:36,093 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 7000, best=0.53, avg=0.50, std=0.01, steps=8.603e+07
2023-07-07 00:52:47,353 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 7100, best=0.52, avg=0.50, std=0.01, steps=8.726e+07
2023-07-07 00:52:58,565 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 7200, best=0.52, avg=0.50, std=0.01, steps=8.849e+07
2023-07-07 00:53:09,799 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 7300, best=0.52, avg=0.50, std=0.01, steps=8.971e+07
2023-07-07 00:53:20,989 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 7400, best=0.52, avg=0.50, std=0.01, steps=9.094e+07
2023-07-07 00:53:32,241 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 7500, best=0.52, avg=0.50, std=0.01, steps=9.217e+07
2023-07-07 00:53:43,507 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 7600, best=0.52, avg=0.50, std=0.01, steps=9.340e+07
2023-07-07 00:53:54,706 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 7700, best=0.52, avg=0.50, std=0.01, steps=9.463e+07
2023-07-07 00:54:05,894 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 7800, best=0.52, avg=0.50, std=0.01, steps=9.586e+07
2023-07-07 00:54:17,062 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 7900, best=0.52, avg=0.50, std=0.01, steps=9.709e+07
2023-07-07 00:54:28,237 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 8000, best=0.51, avg=0.50, std=0.01, steps=9.832e+07
2023-07-07 00:54:39,429 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 8100, best=0.52, avg=0.50, std=0.01, steps=9.955e+07
2023-07-07 00:54:50,650 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 8200, best=0.52, avg=0.50, std=0.01, steps=1.008e+08
2023-07-07 00:55:01,848 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 8300, best=0.52, avg=0.50, std=0.01, steps=1.020e+08
2023-07-07 00:55:13,059 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 8400, best=0.52, avg=0.50, std=0.01, steps=1.032e+08
2023-07-07 00:55:24,265 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 8500, best=0.51, avg=0.50, std=0.01, steps=1.045e+08
2023-07-07 00:55:35,508 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 8600, best=0.52, avg=0.50, std=0.01, steps=1.057e+08
2023-07-07 00:55:46,710 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 8700, best=0.52, avg=0.50, std=0.01, steps=1.069e+08
2023-07-07 00:55:57,944 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 8800, best=0.52, avg=0.50, std=0.01, steps=1.081e+08
2023-07-07 00:56:09,169 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 8900, best=0.52, avg=0.50, std=0.01, steps=1.094e+08
2023-07-07 00:56:20,364 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 9000, best=0.52, avg=0.50, std=0.01, steps=1.106e+08
2023-07-07 00:56:31,593 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 9100, best=0.52, avg=0.50, std=0.01, steps=1.118e+08
2023-07-07 00:56:42,847 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 9200, best=0.52, avg=0.50, std=0.01, steps=1.131e+08
2023-07-07 00:56:54,071 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 9300, best=0.52, avg=0.50, std=0.01, steps=1.143e+08
2023-07-07 00:57:05,337 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 9400, best=0.53, avg=0.50, std=0.01, steps=1.155e+08
2023-07-07 00:57:16,558 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 9500, best=0.52, avg=0.50, std=0.01, steps=1.167e+08
2023-07-07 00:57:27,720 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 9600, best=0.65, avg=0.64, std=0.01, steps=1.180e+08
2023-07-07 00:57:38,927 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 9700, best=0.68, avg=0.66, std=0.00, steps=1.192e+08
2023-07-07 00:57:50,117 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 9800, best=0.70, avg=0.68, std=0.01, steps=1.204e+08
2023-07-07 00:58:01,344 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 9900, best=0.72, avg=0.70, std=0.01, steps=1.217e+08
2023-07-07 00:58:12,591 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 10000, best=0.72, avg=0.70, std=0.01, steps=1.229e+08
2023-07-07 00:58:23,791 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 10100, best=0.72, avg=0.71, std=0.01, steps=1.241e+08
2023-07-07 00:58:35,073 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 10200, best=0.73, avg=0.71, std=0.01, steps=1.253e+08
2023-07-07 00:58:46,287 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 10300, best=0.73, avg=0.72, std=0.01, steps=1.266e+08
2023-07-07 00:58:57,484 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 10400, best=0.73, avg=0.72, std=0.00, steps=1.278e+08
2023-07-07 00:59:08,685 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 10500, best=0.74, avg=0.72, std=0.01, steps=1.290e+08
2023-07-07 00:59:19,884 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 10600, best=0.74, avg=0.73, std=0.01, steps=1.303e+08
2023-07-07 00:59:31,140 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 10700, best=0.74, avg=0.73, std=0.01, steps=1.315e+08
2023-07-07 00:59:42,421 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 10800, best=0.74, avg=0.73, std=0.01, steps=1.327e+08
2023-07-07 00:59:53,745 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 10900, best=0.75, avg=0.73, std=0.01, steps=1.340e+08
2023-07-07 01:00:04,955 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 11000, best=0.75, avg=0.73, std=0.01, steps=1.352e+08
2023-07-07 01:00:16,163 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 11100, best=0.75, avg=0.73, std=0.01, steps=1.364e+08
2023-07-07 01:00:27,355 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 11200, best=0.76, avg=0.74, std=0.01, steps=1.376e+08
2023-07-07 01:00:38,564 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 11300, best=0.76, avg=0.75, std=0.01, steps=1.389e+08
2023-07-07 01:00:49,808 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 11400, best=0.76, avg=0.74, std=0.01, steps=1.401e+08
2023-07-07 01:01:01,054 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 11500, best=0.76, avg=0.75, std=0.01, steps=1.413e+08
2023-07-07 01:01:12,254 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 11600, best=0.76, avg=0.75, std=0.01, steps=1.426e+08
2023-07-07 01:01:23,484 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 11700, best=0.77, avg=0.75, std=0.01, steps=1.438e+08
2023-07-07 01:01:34,702 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 11800, best=0.77, avg=0.75, std=0.01, steps=1.450e+08
2023-07-07 01:01:45,962 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 11900, best=0.76, avg=0.75, std=0.01, steps=1.462e+08
2023-07-07 01:01:57,136 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 0, [Train]: 11999, best=0.77, avg=0.76, std=0.01, steps=1.475e+08
2023-07-07 01:01:57,136 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 01:01:57,158 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 01:01:57,186 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 01:02:06,915 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 100, best=0.64, avg=0.63, std=0.00, steps=8.274e+05
2023-07-07 01:02:14,469 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 200, best=0.71, avg=0.70, std=0.00, steps=1.647e+06
2023-07-07 01:02:22,071 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 300, best=0.76, avg=0.75, std=0.00, steps=2.466e+06
2023-07-07 01:02:29,640 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 400, best=0.78, avg=0.77, std=0.00, steps=3.285e+06
2023-07-07 01:02:37,208 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 500, best=0.79, avg=0.78, std=0.00, steps=4.104e+06
2023-07-07 01:02:44,772 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 600, best=0.80, avg=0.79, std=0.00, steps=4.923e+06
2023-07-07 01:02:52,313 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 700, best=0.82, avg=0.81, std=0.00, steps=5.743e+06
2023-07-07 01:02:59,877 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 800, best=0.83, avg=0.82, std=0.00, steps=6.562e+06
2023-07-07 01:03:07,477 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 900, best=0.85, avg=0.83, std=0.00, steps=7.381e+06
2023-07-07 01:03:15,023 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 1000, best=0.86, avg=0.85, std=0.00, steps=8.200e+06
2023-07-07 01:03:22,548 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 1100, best=0.86, avg=0.85, std=0.00, steps=9.019e+06
2023-07-07 01:03:30,122 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 1200, best=0.87, avg=0.86, std=0.00, steps=9.839e+06
2023-07-07 01:03:37,709 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 1300, best=0.87, avg=0.87, std=0.00, steps=1.066e+07
2023-07-07 01:03:45,292 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 1400, best=0.88, avg=0.87, std=0.00, steps=1.148e+07
2023-07-07 01:03:52,844 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 1500, best=0.88, avg=0.88, std=0.00, steps=1.230e+07
2023-07-07 01:04:00,381 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 1600, best=0.89, avg=0.88, std=0.00, steps=1.312e+07
2023-07-07 01:04:07,933 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 1700, best=0.89, avg=0.88, std=0.00, steps=1.393e+07
2023-07-07 01:04:15,473 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 1800, best=0.89, avg=0.88, std=0.00, steps=1.475e+07
2023-07-07 01:04:23,034 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 1900, best=0.89, avg=0.89, std=0.00, steps=1.557e+07
2023-07-07 01:04:30,616 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 2000, best=0.90, avg=0.89, std=0.00, steps=1.639e+07
2023-07-07 01:04:38,170 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 2100, best=0.90, avg=0.89, std=0.00, steps=1.721e+07
2023-07-07 01:04:45,711 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 2200, best=0.90, avg=0.89, std=0.00, steps=1.803e+07
2023-07-07 01:04:53,273 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 2300, best=0.90, avg=0.89, std=0.00, steps=1.885e+07
2023-07-07 01:05:00,829 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 2400, best=0.90, avg=0.90, std=0.00, steps=1.967e+07
2023-07-07 01:05:08,394 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 2500, best=0.90, avg=0.90, std=0.00, steps=2.049e+07
2023-07-07 01:05:16,011 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 2600, best=0.91, avg=0.90, std=0.00, steps=2.131e+07
2023-07-07 01:05:23,627 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 2700, best=0.91, avg=0.90, std=0.00, steps=2.213e+07
2023-07-07 01:05:31,211 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 2800, best=0.91, avg=0.90, std=0.00, steps=2.295e+07
2023-07-07 01:05:38,752 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 2900, best=0.91, avg=0.90, std=0.00, steps=2.376e+07
2023-07-07 01:05:46,322 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 3000, best=0.91, avg=0.90, std=0.00, steps=2.458e+07
2023-07-07 01:05:53,876 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 3100, best=0.91, avg=0.90, std=0.00, steps=2.540e+07
2023-07-07 01:06:01,410 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 3200, best=0.91, avg=0.90, std=0.00, steps=2.622e+07
2023-07-07 01:06:08,967 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 3300, best=0.91, avg=0.90, std=0.00, steps=2.704e+07
2023-07-07 01:06:16,522 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 3400, best=0.91, avg=0.90, std=0.00, steps=2.786e+07
2023-07-07 01:06:24,072 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 3500, best=0.91, avg=0.90, std=0.00, steps=2.868e+07
2023-07-07 01:06:31,617 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 3600, best=0.91, avg=0.90, std=0.00, steps=2.950e+07
2023-07-07 01:06:39,161 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 3700, best=0.91, avg=0.91, std=0.00, steps=3.032e+07
2023-07-07 01:06:46,727 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 3800, best=0.91, avg=0.91, std=0.00, steps=3.114e+07
2023-07-07 01:06:54,267 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 3900, best=0.91, avg=0.91, std=0.00, steps=3.196e+07
2023-07-07 01:07:01,809 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 4000, best=0.91, avg=0.91, std=0.00, steps=3.278e+07
2023-07-07 01:07:09,355 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 4100, best=0.91, avg=0.91, std=0.00, steps=3.360e+07
2023-07-07 01:07:16,908 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 4200, best=0.91, avg=0.91, std=0.00, steps=3.441e+07
2023-07-07 01:07:24,458 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 4300, best=0.92, avg=0.91, std=0.00, steps=3.523e+07
2023-07-07 01:07:32,030 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 4400, best=0.91, avg=0.91, std=0.00, steps=3.605e+07
2023-07-07 01:07:39,650 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 4500, best=0.92, avg=0.91, std=0.00, steps=3.687e+07
2023-07-07 01:07:47,201 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 4600, best=0.91, avg=0.91, std=0.00, steps=3.769e+07
2023-07-07 01:07:54,755 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 4700, best=0.92, avg=0.91, std=0.00, steps=3.851e+07
2023-07-07 01:08:02,306 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 4800, best=0.92, avg=0.91, std=0.00, steps=3.933e+07
2023-07-07 01:08:09,852 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 4900, best=0.91, avg=0.91, std=0.00, steps=4.015e+07
2023-07-07 01:08:17,409 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 5000, best=0.92, avg=0.91, std=0.00, steps=4.097e+07
2023-07-07 01:08:24,975 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 5100, best=0.91, avg=0.91, std=0.00, steps=4.179e+07
2023-07-07 01:08:32,545 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 5200, best=0.92, avg=0.91, std=0.00, steps=4.261e+07
2023-07-07 01:08:40,110 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 5300, best=0.92, avg=0.91, std=0.00, steps=4.343e+07
2023-07-07 01:08:47,678 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 5400, best=0.92, avg=0.91, std=0.00, steps=4.424e+07
2023-07-07 01:08:55,259 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 5500, best=0.92, avg=0.91, std=0.00, steps=4.506e+07
2023-07-07 01:09:02,874 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 5600, best=0.92, avg=0.91, std=0.00, steps=4.588e+07
2023-07-07 01:09:10,442 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 5700, best=0.92, avg=0.91, std=0.00, steps=4.670e+07
2023-07-07 01:09:18,008 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 5800, best=0.92, avg=0.91, std=0.00, steps=4.752e+07
2023-07-07 01:09:25,577 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 5900, best=0.92, avg=0.91, std=0.00, steps=4.834e+07
2023-07-07 01:09:33,141 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 6000, best=0.92, avg=0.91, std=0.00, steps=4.916e+07
2023-07-07 01:09:40,757 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 6100, best=0.92, avg=0.91, std=0.00, steps=4.998e+07
2023-07-07 01:09:48,332 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 6200, best=0.92, avg=0.91, std=0.00, steps=5.080e+07
2023-07-07 01:09:55,915 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 6300, best=0.92, avg=0.91, std=0.00, steps=5.162e+07
2023-07-07 01:10:03,474 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 6400, best=0.92, avg=0.91, std=0.00, steps=5.244e+07
2023-07-07 01:10:11,043 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 6500, best=0.92, avg=0.91, std=0.00, steps=5.326e+07
2023-07-07 01:10:18,619 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 6600, best=0.92, avg=0.91, std=0.00, steps=5.408e+07
2023-07-07 01:10:26,159 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 6700, best=0.92, avg=0.91, std=0.00, steps=5.489e+07
2023-07-07 01:10:33,723 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 6800, best=0.92, avg=0.91, std=0.00, steps=5.571e+07
2023-07-07 01:10:41,298 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 6900, best=0.92, avg=0.91, std=0.00, steps=5.653e+07
2023-07-07 01:10:48,905 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 7000, best=0.92, avg=0.91, std=0.00, steps=5.735e+07
2023-07-07 01:10:56,501 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 7100, best=0.92, avg=0.91, std=0.00, steps=5.817e+07
2023-07-07 01:11:04,105 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 7200, best=0.92, avg=0.91, std=0.00, steps=5.899e+07
2023-07-07 01:11:11,656 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 7300, best=0.92, avg=0.91, std=0.00, steps=5.981e+07
2023-07-07 01:11:19,209 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 7400, best=0.92, avg=0.91, std=0.00, steps=6.063e+07
2023-07-07 01:11:26,792 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 7500, best=0.92, avg=0.91, std=0.00, steps=6.145e+07
2023-07-07 01:11:34,358 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 7600, best=0.92, avg=0.91, std=0.00, steps=6.227e+07
2023-07-07 01:11:41,926 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 7700, best=0.92, avg=0.91, std=0.00, steps=6.309e+07
2023-07-07 01:11:49,497 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 7800, best=0.92, avg=0.91, std=0.00, steps=6.391e+07
2023-07-07 01:11:57,083 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 7900, best=0.92, avg=0.91, std=0.00, steps=6.472e+07
2023-07-07 01:12:04,660 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 8000, best=0.92, avg=0.91, std=0.00, steps=6.554e+07
2023-07-07 01:12:12,211 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 8100, best=0.92, avg=0.91, std=0.00, steps=6.636e+07
2023-07-07 01:12:19,767 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 8200, best=0.92, avg=0.91, std=0.00, steps=6.718e+07
2023-07-07 01:12:27,328 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 8300, best=0.92, avg=0.91, std=0.00, steps=6.800e+07
2023-07-07 01:12:34,888 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 8400, best=0.92, avg=0.91, std=0.00, steps=6.882e+07
2023-07-07 01:12:42,436 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 8500, best=0.92, avg=0.91, std=0.00, steps=6.964e+07
2023-07-07 01:12:49,989 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 8600, best=0.92, avg=0.91, std=0.00, steps=7.046e+07
2023-07-07 01:12:57,592 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 8700, best=0.92, avg=0.91, std=0.00, steps=7.128e+07
2023-07-07 01:13:05,147 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 8800, best=0.92, avg=0.91, std=0.00, steps=7.210e+07
2023-07-07 01:13:12,704 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 8900, best=0.92, avg=0.91, std=0.00, steps=7.292e+07
2023-07-07 01:13:20,270 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 9000, best=0.92, avg=0.91, std=0.00, steps=7.374e+07
2023-07-07 01:13:27,830 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 9100, best=0.92, avg=0.91, std=0.00, steps=7.456e+07
2023-07-07 01:13:35,437 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 9200, best=0.92, avg=0.92, std=0.00, steps=7.537e+07
2023-07-07 01:13:43,019 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 9300, best=0.92, avg=0.92, std=0.00, steps=7.619e+07
2023-07-07 01:13:50,573 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 9400, best=0.92, avg=0.92, std=0.00, steps=7.701e+07
2023-07-07 01:13:58,132 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 9500, best=0.92, avg=0.92, std=0.00, steps=7.783e+07
2023-07-07 01:14:05,703 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 9600, best=0.92, avg=0.92, std=0.00, steps=7.865e+07
2023-07-07 01:14:13,255 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 9700, best=0.93, avg=0.92, std=0.00, steps=7.947e+07
2023-07-07 01:14:20,788 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 9800, best=0.92, avg=0.92, std=0.00, steps=8.029e+07
2023-07-07 01:14:28,382 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 9900, best=0.93, avg=0.92, std=0.00, steps=8.111e+07
2023-07-07 01:14:35,972 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 10000, best=0.93, avg=0.92, std=0.00, steps=8.193e+07
2023-07-07 01:14:43,560 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 10100, best=0.93, avg=0.92, std=0.00, steps=8.275e+07
2023-07-07 01:14:51,114 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 10200, best=0.93, avg=0.92, std=0.00, steps=8.357e+07
2023-07-07 01:14:58,695 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 10300, best=0.93, avg=0.92, std=0.00, steps=8.439e+07
2023-07-07 01:15:06,253 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 10400, best=0.93, avg=0.92, std=0.00, steps=8.520e+07
2023-07-07 01:15:13,803 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 10500, best=0.93, avg=0.92, std=0.00, steps=8.602e+07
2023-07-07 01:15:21,367 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 10600, best=0.93, avg=0.93, std=0.00, steps=8.684e+07
2023-07-07 01:15:28,939 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 10700, best=0.93, avg=0.92, std=0.00, steps=8.766e+07
2023-07-07 01:15:36,548 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 10800, best=0.93, avg=0.93, std=0.00, steps=8.848e+07
2023-07-07 01:15:44,137 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 10900, best=0.93, avg=0.93, std=0.00, steps=8.930e+07
2023-07-07 01:15:51,735 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 11000, best=0.93, avg=0.93, std=0.00, steps=9.012e+07
2023-07-07 01:15:59,327 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 11100, best=0.93, avg=0.93, std=0.00, steps=9.094e+07
2023-07-07 01:16:06,885 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 11200, best=0.93, avg=0.93, std=0.00, steps=9.176e+07
2023-07-07 01:16:14,439 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 11300, best=0.93, avg=0.93, std=0.00, steps=9.258e+07
2023-07-07 01:16:22,003 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 11400, best=0.93, avg=0.93, std=0.00, steps=9.340e+07
2023-07-07 01:16:29,568 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 11500, best=0.93, avg=0.93, std=0.00, steps=9.422e+07
2023-07-07 01:16:37,178 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 11600, best=0.93, avg=0.93, std=0.00, steps=9.504e+07
2023-07-07 01:16:44,818 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 11700, best=0.94, avg=0.93, std=0.00, steps=9.585e+07
2023-07-07 01:16:52,428 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 11800, best=0.94, avg=0.93, std=0.00, steps=9.667e+07
2023-07-07 01:17:00,043 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 11900, best=0.94, avg=0.93, std=0.00, steps=9.749e+07
2023-07-07 01:17:07,567 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 0, [Train]: 11999, best=0.93, avg=0.93, std=0.00, steps=9.830e+07
2023-07-07 01:17:07,568 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 01:17:07,594 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 01:17:07,623 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 01:17:19,176 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 100, best=0.51, avg=0.50, std=0.01, steps=1.034e+06
2023-07-07 01:17:28,522 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 200, best=0.51, avg=0.50, std=0.01, steps=2.058e+06
2023-07-07 01:17:37,857 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 300, best=0.52, avg=0.50, std=0.01, steps=3.082e+06
2023-07-07 01:17:47,255 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 400, best=0.51, avg=0.50, std=0.01, steps=4.106e+06
2023-07-07 01:17:56,641 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 500, best=0.51, avg=0.50, std=0.01, steps=5.130e+06
2023-07-07 01:18:06,020 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 600, best=0.51, avg=0.50, std=0.01, steps=6.154e+06
2023-07-07 01:18:15,402 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 700, best=0.51, avg=0.50, std=0.01, steps=7.178e+06
2023-07-07 01:18:24,778 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 800, best=0.51, avg=0.50, std=0.01, steps=8.202e+06
2023-07-07 01:18:34,145 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 900, best=0.52, avg=0.50, std=0.01, steps=9.226e+06
2023-07-07 01:18:43,523 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 1000, best=0.51, avg=0.50, std=0.01, steps=1.025e+07
2023-07-07 01:18:52,986 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 1100, best=0.52, avg=0.50, std=0.01, steps=1.127e+07
2023-07-07 01:19:02,460 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 1200, best=0.52, avg=0.50, std=0.01, steps=1.230e+07
2023-07-07 01:19:11,816 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 1300, best=0.51, avg=0.50, std=0.01, steps=1.332e+07
2023-07-07 01:19:21,224 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 1400, best=0.51, avg=0.50, std=0.01, steps=1.435e+07
2023-07-07 01:19:30,605 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 1500, best=0.51, avg=0.50, std=0.01, steps=1.537e+07
2023-07-07 01:19:40,030 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 1600, best=0.51, avg=0.50, std=0.00, steps=1.639e+07
2023-07-07 01:19:49,410 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 1700, best=0.51, avg=0.50, std=0.01, steps=1.742e+07
2023-07-07 01:19:58,772 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 1800, best=0.52, avg=0.50, std=0.01, steps=1.844e+07
2023-07-07 01:20:08,158 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 1900, best=0.52, avg=0.50, std=0.01, steps=1.947e+07
2023-07-07 01:20:17,573 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 2000, best=0.51, avg=0.50, std=0.01, steps=2.049e+07
2023-07-07 01:20:26,943 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 2100, best=0.51, avg=0.50, std=0.01, steps=2.151e+07
2023-07-07 01:20:36,318 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 2200, best=0.51, avg=0.50, std=0.00, steps=2.254e+07
2023-07-07 01:20:45,675 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 2300, best=0.52, avg=0.50, std=0.01, steps=2.356e+07
2023-07-07 01:20:55,034 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 2400, best=0.52, avg=0.50, std=0.01, steps=2.459e+07
2023-07-07 01:21:04,427 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 2500, best=0.51, avg=0.50, std=0.01, steps=2.561e+07
2023-07-07 01:21:13,792 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 2600, best=0.51, avg=0.50, std=0.01, steps=2.663e+07
2023-07-07 01:21:23,186 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 2700, best=0.52, avg=0.50, std=0.01, steps=2.766e+07
2023-07-07 01:21:32,586 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 2800, best=0.52, avg=0.50, std=0.01, steps=2.868e+07
2023-07-07 01:21:41,990 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 2900, best=0.51, avg=0.50, std=0.01, steps=2.971e+07
2023-07-07 01:21:51,398 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 3000, best=0.52, avg=0.50, std=0.01, steps=3.073e+07
2023-07-07 01:22:00,804 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 3100, best=0.51, avg=0.50, std=0.01, steps=3.175e+07
2023-07-07 01:22:10,253 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 3200, best=0.52, avg=0.50, std=0.01, steps=3.278e+07
2023-07-07 01:22:19,637 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 3300, best=0.51, avg=0.50, std=0.01, steps=3.380e+07
2023-07-07 01:22:29,013 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 3400, best=0.51, avg=0.50, std=0.01, steps=3.483e+07
2023-07-07 01:22:38,384 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 3500, best=0.51, avg=0.50, std=0.01, steps=3.585e+07
2023-07-07 01:22:47,770 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 3600, best=0.52, avg=0.50, std=0.01, steps=3.687e+07
2023-07-07 01:22:57,141 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 3700, best=0.51, avg=0.50, std=0.01, steps=3.790e+07
2023-07-07 01:23:06,574 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 3800, best=0.51, avg=0.50, std=0.01, steps=3.892e+07
2023-07-07 01:23:15,958 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 3900, best=0.51, avg=0.50, std=0.01, steps=3.995e+07
2023-07-07 01:23:25,332 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 4000, best=0.52, avg=0.50, std=0.01, steps=4.097e+07
2023-07-07 01:23:34,698 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 4100, best=0.51, avg=0.50, std=0.01, steps=4.199e+07
2023-07-07 01:23:44,060 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 4200, best=0.51, avg=0.50, std=0.00, steps=4.302e+07
2023-07-07 01:23:53,431 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 4300, best=0.52, avg=0.50, std=0.01, steps=4.404e+07
2023-07-07 01:24:02,856 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 4400, best=0.52, avg=0.50, std=0.01, steps=4.507e+07
2023-07-07 01:24:12,253 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 4500, best=0.52, avg=0.50, std=0.01, steps=4.609e+07
2023-07-07 01:24:21,646 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 4600, best=0.51, avg=0.50, std=0.01, steps=4.711e+07
2023-07-07 01:24:31,030 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 4700, best=0.51, avg=0.50, std=0.01, steps=4.814e+07
2023-07-07 01:24:40,408 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 4800, best=0.52, avg=0.50, std=0.01, steps=4.916e+07
2023-07-07 01:24:49,826 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 4900, best=0.52, avg=0.50, std=0.01, steps=5.019e+07
2023-07-07 01:24:59,207 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 5000, best=0.51, avg=0.50, std=0.01, steps=5.121e+07
2023-07-07 01:25:08,587 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 5100, best=0.52, avg=0.50, std=0.01, steps=5.223e+07
2023-07-07 01:25:17,977 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 5200, best=0.51, avg=0.50, std=0.01, steps=5.326e+07
2023-07-07 01:25:27,370 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 5300, best=0.51, avg=0.50, std=0.01, steps=5.428e+07
2023-07-07 01:25:36,764 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 5400, best=0.51, avg=0.50, std=0.01, steps=5.531e+07
2023-07-07 01:25:46,209 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 5500, best=0.51, avg=0.50, std=0.01, steps=5.633e+07
2023-07-07 01:25:55,663 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 5600, best=0.52, avg=0.50, std=0.01, steps=5.735e+07
2023-07-07 01:26:05,073 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 5700, best=0.51, avg=0.50, std=0.01, steps=5.838e+07
2023-07-07 01:26:14,502 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 5800, best=0.51, avg=0.50, std=0.01, steps=5.940e+07
2023-07-07 01:26:23,906 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 5900, best=0.51, avg=0.50, std=0.01, steps=6.043e+07
2023-07-07 01:26:33,290 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 6000, best=0.51, avg=0.50, std=0.01, steps=6.145e+07
2023-07-07 01:26:42,697 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 6100, best=0.52, avg=0.50, std=0.01, steps=6.247e+07
2023-07-07 01:26:52,077 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 6200, best=0.51, avg=0.50, std=0.01, steps=6.350e+07
2023-07-07 01:27:01,513 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 6300, best=0.51, avg=0.50, std=0.01, steps=6.452e+07
2023-07-07 01:27:10,922 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 6400, best=0.51, avg=0.50, std=0.00, steps=6.555e+07
2023-07-07 01:27:20,345 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 6500, best=0.51, avg=0.50, std=0.01, steps=6.657e+07
2023-07-07 01:27:29,736 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 6600, best=0.51, avg=0.50, std=0.01, steps=6.759e+07
2023-07-07 01:27:39,133 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 6700, best=0.52, avg=0.50, std=0.01, steps=6.862e+07
2023-07-07 01:27:48,511 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 6800, best=0.51, avg=0.50, std=0.01, steps=6.964e+07
2023-07-07 01:27:57,884 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 6900, best=0.51, avg=0.50, std=0.01, steps=7.067e+07
2023-07-07 01:28:07,292 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 7000, best=0.51, avg=0.50, std=0.01, steps=7.169e+07
2023-07-07 01:28:16,702 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 7100, best=0.52, avg=0.50, std=0.01, steps=7.271e+07
2023-07-07 01:28:26,084 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 7200, best=0.51, avg=0.50, std=0.01, steps=7.374e+07
2023-07-07 01:28:35,446 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 7300, best=0.51, avg=0.50, std=0.01, steps=7.476e+07
2023-07-07 01:28:44,821 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 7400, best=0.51, avg=0.50, std=0.01, steps=7.579e+07
2023-07-07 01:28:54,185 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 7500, best=0.52, avg=0.50, std=0.01, steps=7.681e+07
2023-07-07 01:29:03,575 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 7600, best=0.51, avg=0.50, std=0.01, steps=7.783e+07
2023-07-07 01:29:12,956 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 7700, best=0.52, avg=0.50, std=0.01, steps=7.886e+07
2023-07-07 01:29:22,327 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 7800, best=0.51, avg=0.50, std=0.01, steps=7.988e+07
2023-07-07 01:29:31,718 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 7900, best=0.51, avg=0.50, std=0.01, steps=8.091e+07
2023-07-07 01:29:41,094 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 8000, best=0.52, avg=0.50, std=0.01, steps=8.193e+07
2023-07-07 01:29:50,523 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 8100, best=0.52, avg=0.50, std=0.01, steps=8.295e+07
2023-07-07 01:29:59,874 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 8200, best=0.51, avg=0.50, std=0.01, steps=8.398e+07
2023-07-07 01:30:09,230 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 8300, best=0.51, avg=0.50, std=0.01, steps=8.500e+07
2023-07-07 01:30:18,645 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 8400, best=0.52, avg=0.50, std=0.01, steps=8.603e+07
2023-07-07 01:30:27,996 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 8500, best=0.51, avg=0.50, std=0.01, steps=8.705e+07
2023-07-07 01:30:37,400 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 8600, best=0.51, avg=0.50, std=0.01, steps=8.807e+07
2023-07-07 01:30:46,755 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 8700, best=0.51, avg=0.50, std=0.01, steps=8.910e+07
2023-07-07 01:30:56,106 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 8800, best=0.51, avg=0.50, std=0.01, steps=9.012e+07
2023-07-07 01:31:05,486 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 8900, best=0.51, avg=0.50, std=0.01, steps=9.115e+07
2023-07-07 01:31:14,830 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 9000, best=0.52, avg=0.50, std=0.01, steps=9.217e+07
2023-07-07 01:31:24,181 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 9100, best=0.52, avg=0.50, std=0.01, steps=9.319e+07
2023-07-07 01:31:33,545 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 9200, best=0.51, avg=0.50, std=0.01, steps=9.422e+07
2023-07-07 01:31:42,926 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 9300, best=0.51, avg=0.50, std=0.01, steps=9.524e+07
2023-07-07 01:31:52,285 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 9400, best=0.51, avg=0.50, std=0.01, steps=9.627e+07
2023-07-07 01:32:01,642 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 9500, best=0.52, avg=0.50, std=0.01, steps=9.729e+07
2023-07-07 01:32:11,009 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 9600, best=0.51, avg=0.50, std=0.00, steps=9.831e+07
2023-07-07 01:32:20,439 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 9700, best=0.51, avg=0.50, std=0.01, steps=9.934e+07
2023-07-07 01:32:29,878 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 9800, best=0.51, avg=0.50, std=0.01, steps=1.004e+08
2023-07-07 01:32:39,305 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 9900, best=0.66, avg=0.65, std=0.00, steps=1.014e+08
2023-07-07 01:32:48,699 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 10000, best=0.68, avg=0.68, std=0.00, steps=1.024e+08
2023-07-07 01:32:58,058 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 10100, best=0.70, avg=0.69, std=0.00, steps=1.034e+08
2023-07-07 01:33:07,428 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 10200, best=0.71, avg=0.70, std=0.00, steps=1.045e+08
2023-07-07 01:33:16,836 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 10300, best=0.72, avg=0.70, std=0.00, steps=1.055e+08
2023-07-07 01:33:26,250 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 10400, best=0.72, avg=0.71, std=0.00, steps=1.065e+08
2023-07-07 01:33:35,606 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 10500, best=0.73, avg=0.72, std=0.00, steps=1.075e+08
2023-07-07 01:33:45,028 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 10600, best=0.73, avg=0.72, std=0.00, steps=1.086e+08
2023-07-07 01:33:54,406 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 10700, best=0.74, avg=0.73, std=0.00, steps=1.096e+08
2023-07-07 01:34:03,766 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 10800, best=0.75, avg=0.73, std=0.00, steps=1.106e+08
2023-07-07 01:34:13,132 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 10900, best=0.75, avg=0.74, std=0.00, steps=1.116e+08
2023-07-07 01:34:22,536 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 11000, best=0.75, avg=0.74, std=0.00, steps=1.127e+08
2023-07-07 01:34:31,900 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 11100, best=0.76, avg=0.75, std=0.00, steps=1.137e+08
2023-07-07 01:34:41,263 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 11200, best=0.76, avg=0.75, std=0.00, steps=1.147e+08
2023-07-07 01:34:50,631 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 11300, best=0.77, avg=0.75, std=0.00, steps=1.157e+08
2023-07-07 01:35:00,019 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 11400, best=0.77, avg=0.76, std=0.00, steps=1.167e+08
2023-07-07 01:35:09,472 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 11500, best=0.77, avg=0.76, std=0.00, steps=1.178e+08
2023-07-07 01:35:18,933 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 11600, best=0.77, avg=0.76, std=0.00, steps=1.188e+08
2023-07-07 01:35:28,350 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 11700, best=0.78, avg=0.77, std=0.00, steps=1.198e+08
2023-07-07 01:35:37,752 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 11800, best=0.78, avg=0.77, std=0.00, steps=1.208e+08
2023-07-07 01:35:47,151 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 11900, best=0.79, avg=0.77, std=0.00, steps=1.219e+08
2023-07-07 01:35:56,441 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 0, [Train]: 11999, best=0.79, avg=0.78, std=0.00, steps=1.229e+08
2023-07-07 01:35:56,442 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 01:35:56,465 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 01:35:56,497 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 01:36:09,861 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 100, best=0.51, avg=0.50, std=0.01, steps=1.241e+06
2023-07-07 01:36:21,126 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 200, best=0.51, avg=0.50, std=0.01, steps=2.470e+06
2023-07-07 01:36:32,356 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 300, best=0.52, avg=0.50, std=0.01, steps=3.699e+06
2023-07-07 01:36:43,571 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 400, best=0.51, avg=0.50, std=0.01, steps=4.927e+06
2023-07-07 01:36:54,830 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 500, best=0.51, avg=0.50, std=0.01, steps=6.156e+06
2023-07-07 01:37:06,020 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 600, best=0.51, avg=0.50, std=0.01, steps=7.385e+06
2023-07-07 01:37:17,305 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 700, best=0.51, avg=0.50, std=0.01, steps=8.614e+06
2023-07-07 01:37:28,515 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 800, best=0.51, avg=0.50, std=0.01, steps=9.843e+06
2023-07-07 01:37:39,725 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 900, best=0.52, avg=0.50, std=0.01, steps=1.107e+07
2023-07-07 01:37:50,953 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 1000, best=0.51, avg=0.50, std=0.01, steps=1.230e+07
2023-07-07 01:38:02,167 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 1100, best=0.52, avg=0.50, std=0.01, steps=1.353e+07
2023-07-07 01:38:13,375 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 1200, best=0.52, avg=0.50, std=0.01, steps=1.476e+07
2023-07-07 01:38:24,626 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 1300, best=0.51, avg=0.50, std=0.01, steps=1.599e+07
2023-07-07 01:38:35,839 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 1400, best=0.51, avg=0.50, std=0.01, steps=1.722e+07
2023-07-07 01:38:47,134 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 1500, best=0.51, avg=0.50, std=0.01, steps=1.844e+07
2023-07-07 01:38:58,413 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 1600, best=0.51, avg=0.50, std=0.00, steps=1.967e+07
2023-07-07 01:39:09,651 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 1700, best=0.51, avg=0.50, std=0.01, steps=2.090e+07
2023-07-07 01:39:20,927 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 1800, best=0.52, avg=0.50, std=0.01, steps=2.213e+07
2023-07-07 01:39:32,189 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 1900, best=0.52, avg=0.50, std=0.01, steps=2.336e+07
2023-07-07 01:39:43,415 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 2000, best=0.51, avg=0.50, std=0.01, steps=2.459e+07
2023-07-07 01:39:54,647 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 2100, best=0.51, avg=0.50, std=0.01, steps=2.582e+07
2023-07-07 01:40:05,859 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 2200, best=0.51, avg=0.50, std=0.00, steps=2.705e+07
2023-07-07 01:40:17,057 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 2300, best=0.52, avg=0.50, std=0.01, steps=2.827e+07
2023-07-07 01:40:28,258 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 2400, best=0.52, avg=0.50, std=0.01, steps=2.950e+07
2023-07-07 01:40:39,450 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 2500, best=0.51, avg=0.50, std=0.01, steps=3.073e+07
2023-07-07 01:40:50,649 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 2600, best=0.60, avg=0.59, std=0.00, steps=3.196e+07
2023-07-07 01:41:01,856 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 2700, best=0.62, avg=0.62, std=0.00, steps=3.319e+07
2023-07-07 01:41:13,067 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 2800, best=0.66, avg=0.64, std=0.00, steps=3.442e+07
2023-07-07 01:41:24,270 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 2900, best=0.66, avg=0.65, std=0.00, steps=3.565e+07
2023-07-07 01:41:35,499 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 3000, best=0.67, avg=0.66, std=0.00, steps=3.688e+07
2023-07-07 01:41:46,729 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 3100, best=0.68, avg=0.67, std=0.00, steps=3.811e+07
2023-07-07 01:41:57,941 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 3200, best=0.69, avg=0.68, std=0.00, steps=3.933e+07
2023-07-07 01:42:09,142 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 3300, best=0.70, avg=0.69, std=0.00, steps=4.056e+07
2023-07-07 01:42:20,346 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 3400, best=0.70, avg=0.69, std=0.00, steps=4.179e+07
2023-07-07 01:42:31,524 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 3500, best=0.71, avg=0.70, std=0.00, steps=4.302e+07
2023-07-07 01:42:42,742 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 3600, best=0.71, avg=0.70, std=0.00, steps=4.425e+07
2023-07-07 01:42:54,011 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 3700, best=0.71, avg=0.70, std=0.00, steps=4.548e+07
2023-07-07 01:43:05,261 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 3800, best=0.72, avg=0.71, std=0.00, steps=4.671e+07
2023-07-07 01:43:16,439 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 3900, best=0.72, avg=0.71, std=0.00, steps=4.794e+07
2023-07-07 01:43:27,617 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 4000, best=0.72, avg=0.71, std=0.00, steps=4.916e+07
2023-07-07 01:43:38,817 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 4100, best=0.73, avg=0.72, std=0.00, steps=5.039e+07
2023-07-07 01:43:50,025 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 4200, best=0.73, avg=0.72, std=0.00, steps=5.162e+07
2023-07-07 01:44:01,273 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 4300, best=0.74, avg=0.72, std=0.00, steps=5.285e+07
2023-07-07 01:44:12,470 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 4400, best=0.74, avg=0.73, std=0.00, steps=5.408e+07
2023-07-07 01:44:23,706 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 4500, best=0.74, avg=0.73, std=0.00, steps=5.531e+07
2023-07-07 01:44:34,967 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 4600, best=0.74, avg=0.73, std=0.00, steps=5.654e+07
2023-07-07 01:44:46,256 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 4700, best=0.74, avg=0.73, std=0.00, steps=5.777e+07
2023-07-07 01:44:57,488 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 4800, best=0.75, avg=0.74, std=0.00, steps=5.899e+07
2023-07-07 01:45:08,736 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 4900, best=0.75, avg=0.74, std=0.00, steps=6.022e+07
2023-07-07 01:45:19,956 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 5000, best=0.75, avg=0.74, std=0.00, steps=6.145e+07
2023-07-07 01:45:31,201 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 5100, best=0.75, avg=0.74, std=0.00, steps=6.268e+07
2023-07-07 01:45:42,475 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 5200, best=0.75, avg=0.74, std=0.00, steps=6.391e+07
2023-07-07 01:45:53,755 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 5300, best=0.76, avg=0.74, std=0.00, steps=6.514e+07
2023-07-07 01:46:05,000 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 5400, best=0.76, avg=0.74, std=0.00, steps=6.637e+07
2023-07-07 01:46:16,180 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 5500, best=0.76, avg=0.74, std=0.00, steps=6.760e+07
2023-07-07 01:46:27,443 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 5600, best=0.75, avg=0.75, std=0.00, steps=6.883e+07
2023-07-07 01:46:38,704 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 5700, best=0.76, avg=0.75, std=0.00, steps=7.005e+07
2023-07-07 01:46:49,883 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 5800, best=0.76, avg=0.75, std=0.00, steps=7.128e+07
2023-07-07 01:47:01,065 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 5900, best=0.76, avg=0.75, std=0.00, steps=7.251e+07
2023-07-07 01:47:12,250 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 6000, best=0.76, avg=0.75, std=0.00, steps=7.374e+07
2023-07-07 01:47:23,457 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 6100, best=0.76, avg=0.75, std=0.00, steps=7.497e+07
2023-07-07 01:47:34,661 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 6200, best=0.76, avg=0.75, std=0.00, steps=7.620e+07
2023-07-07 01:47:45,839 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 6300, best=0.76, avg=0.75, std=0.00, steps=7.743e+07
2023-07-07 01:47:57,043 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 6400, best=0.77, avg=0.75, std=0.00, steps=7.866e+07
2023-07-07 01:48:08,230 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 6500, best=0.76, avg=0.75, std=0.00, steps=7.988e+07
2023-07-07 01:48:19,401 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 6600, best=0.76, avg=0.76, std=0.00, steps=8.111e+07
2023-07-07 01:48:30,560 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 6700, best=0.77, avg=0.76, std=0.00, steps=8.234e+07
2023-07-07 01:48:41,857 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 6800, best=0.77, avg=0.76, std=0.00, steps=8.357e+07
2023-07-07 01:48:53,220 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 6900, best=0.77, avg=0.76, std=0.00, steps=8.480e+07
2023-07-07 01:49:04,441 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 7000, best=0.77, avg=0.76, std=0.00, steps=8.603e+07
2023-07-07 01:49:15,745 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 7100, best=0.77, avg=0.76, std=0.00, steps=8.726e+07
2023-07-07 01:49:27,013 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 7200, best=0.77, avg=0.76, std=0.00, steps=8.849e+07
2023-07-07 01:49:38,203 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 7300, best=0.77, avg=0.76, std=0.00, steps=8.971e+07
2023-07-07 01:49:49,430 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 7400, best=0.77, avg=0.76, std=0.00, steps=9.094e+07
2023-07-07 01:50:00,646 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 7500, best=0.77, avg=0.76, std=0.00, steps=9.217e+07
2023-07-07 01:50:11,836 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 7600, best=0.78, avg=0.77, std=0.00, steps=9.340e+07
2023-07-07 01:50:23,047 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 7700, best=0.78, avg=0.77, std=0.00, steps=9.463e+07
2023-07-07 01:50:34,290 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 7800, best=0.78, avg=0.77, std=0.00, steps=9.586e+07
2023-07-07 01:50:45,508 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 7900, best=0.78, avg=0.77, std=0.00, steps=9.709e+07
2023-07-07 01:50:56,686 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 8000, best=0.78, avg=0.77, std=0.00, steps=9.832e+07
2023-07-07 01:51:07,887 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 8100, best=0.78, avg=0.77, std=0.00, steps=9.955e+07
2023-07-07 01:51:19,092 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 8200, best=0.78, avg=0.77, std=0.00, steps=1.008e+08
2023-07-07 01:51:30,289 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 8300, best=0.78, avg=0.77, std=0.00, steps=1.020e+08
2023-07-07 01:51:41,492 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 8400, best=0.78, avg=0.77, std=0.00, steps=1.032e+08
2023-07-07 01:51:52,706 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 8500, best=0.78, avg=0.77, std=0.00, steps=1.045e+08
2023-07-07 01:52:03,927 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 8600, best=0.78, avg=0.77, std=0.00, steps=1.057e+08
2023-07-07 01:52:15,130 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 8700, best=0.78, avg=0.77, std=0.00, steps=1.069e+08
2023-07-07 01:52:26,323 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 8800, best=0.79, avg=0.78, std=0.00, steps=1.081e+08
2023-07-07 01:52:37,517 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 8900, best=0.79, avg=0.78, std=0.00, steps=1.094e+08
2023-07-07 01:52:48,706 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 9000, best=0.79, avg=0.78, std=0.00, steps=1.106e+08
2023-07-07 01:52:59,958 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 9100, best=0.79, avg=0.78, std=0.00, steps=1.118e+08
2023-07-07 01:53:11,143 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 9200, best=0.78, avg=0.78, std=0.00, steps=1.131e+08
2023-07-07 01:53:22,355 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 9300, best=0.79, avg=0.78, std=0.00, steps=1.143e+08
2023-07-07 01:53:33,600 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 9400, best=0.79, avg=0.78, std=0.00, steps=1.155e+08
2023-07-07 01:53:44,852 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 9500, best=0.79, avg=0.78, std=0.00, steps=1.167e+08
2023-07-07 01:53:56,047 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 9600, best=0.79, avg=0.78, std=0.00, steps=1.180e+08
2023-07-07 01:54:07,255 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 9700, best=0.79, avg=0.78, std=0.00, steps=1.192e+08
2023-07-07 01:54:18,461 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 9800, best=0.79, avg=0.78, std=0.00, steps=1.204e+08
2023-07-07 01:54:29,652 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 9900, best=0.79, avg=0.78, std=0.00, steps=1.217e+08
2023-07-07 01:54:40,857 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 10000, best=0.79, avg=0.78, std=0.00, steps=1.229e+08
2023-07-07 01:54:52,061 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 10100, best=0.79, avg=0.78, std=0.00, steps=1.241e+08
2023-07-07 01:55:03,320 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 10200, best=0.79, avg=0.78, std=0.00, steps=1.253e+08
2023-07-07 01:55:14,560 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 10300, best=0.80, avg=0.78, std=0.00, steps=1.266e+08
2023-07-07 01:55:25,824 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 10400, best=0.79, avg=0.78, std=0.00, steps=1.278e+08
2023-07-07 01:55:37,063 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 10500, best=0.79, avg=0.79, std=0.00, steps=1.290e+08
2023-07-07 01:55:48,328 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 10600, best=0.79, avg=0.78, std=0.00, steps=1.303e+08
2023-07-07 01:55:59,555 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 10700, best=0.79, avg=0.78, std=0.00, steps=1.315e+08
2023-07-07 01:56:10,824 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 10800, best=0.79, avg=0.79, std=0.00, steps=1.327e+08
2023-07-07 01:56:22,015 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 10900, best=0.79, avg=0.79, std=0.00, steps=1.340e+08
2023-07-07 01:56:33,187 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 11000, best=0.80, avg=0.79, std=0.00, steps=1.352e+08
2023-07-07 01:56:44,364 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 11100, best=0.79, avg=0.79, std=0.00, steps=1.364e+08
2023-07-07 01:56:55,611 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 11200, best=0.80, avg=0.79, std=0.00, steps=1.376e+08
2023-07-07 01:57:06,886 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 11300, best=0.80, avg=0.79, std=0.00, steps=1.389e+08
2023-07-07 01:57:18,139 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 11400, best=0.80, avg=0.79, std=0.00, steps=1.401e+08
2023-07-07 01:57:29,403 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 11500, best=0.80, avg=0.79, std=0.00, steps=1.413e+08
2023-07-07 01:57:40,575 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 11600, best=0.80, avg=0.79, std=0.00, steps=1.426e+08
2023-07-07 01:57:51,753 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 11700, best=0.80, avg=0.79, std=0.00, steps=1.438e+08
2023-07-07 01:58:02,923 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 11800, best=0.80, avg=0.79, std=0.00, steps=1.450e+08
2023-07-07 01:58:14,095 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 11900, best=0.80, avg=0.79, std=0.00, steps=1.462e+08
2023-07-07 01:58:25,183 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 0, [Train]: 11999, best=0.80, avg=0.79, std=0.00, steps=1.475e+08
2023-07-07 01:58:25,183 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 01:58:25,209 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 01:58:25,242 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 01:58:42,233 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 100, best=0.51, avg=0.50, std=0.01, steps=1.655e+06
2023-07-07 01:58:57,179 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 200, best=0.51, avg=0.50, std=0.01, steps=3.293e+06
2023-07-07 01:59:12,050 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 300, best=0.52, avg=0.50, std=0.01, steps=4.932e+06
2023-07-07 01:59:26,946 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 400, best=0.51, avg=0.50, std=0.01, steps=6.570e+06
2023-07-07 01:59:41,824 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 500, best=0.51, avg=0.50, std=0.01, steps=8.208e+06
2023-07-07 01:59:56,739 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 600, best=0.51, avg=0.50, std=0.01, steps=9.847e+06
2023-07-07 02:00:11,631 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 700, best=0.51, avg=0.50, std=0.01, steps=1.149e+07
2023-07-07 02:00:26,527 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 800, best=0.51, avg=0.50, std=0.01, steps=1.312e+07
2023-07-07 02:00:41,436 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 900, best=0.52, avg=0.50, std=0.01, steps=1.476e+07
2023-07-07 02:00:56,338 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 1000, best=0.51, avg=0.50, std=0.01, steps=1.640e+07
2023-07-07 02:01:11,212 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 1100, best=0.52, avg=0.50, std=0.01, steps=1.804e+07
2023-07-07 02:01:26,064 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 1200, best=0.52, avg=0.50, std=0.01, steps=1.968e+07
2023-07-07 02:01:40,991 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 1300, best=0.51, avg=0.50, std=0.01, steps=2.132e+07
2023-07-07 02:01:55,891 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 1400, best=0.51, avg=0.50, std=0.01, steps=2.295e+07
2023-07-07 02:02:10,850 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 1500, best=0.52, avg=0.50, std=0.01, steps=2.459e+07
2023-07-07 02:02:25,733 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 1600, best=0.51, avg=0.50, std=0.00, steps=2.623e+07
2023-07-07 02:02:40,692 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 1700, best=0.51, avg=0.50, std=0.01, steps=2.787e+07
2023-07-07 02:02:55,641 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 1800, best=0.51, avg=0.50, std=0.01, steps=2.951e+07
2023-07-07 02:03:10,474 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 1900, best=0.51, avg=0.50, std=0.01, steps=3.115e+07
2023-07-07 02:03:25,293 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 2000, best=0.51, avg=0.50, std=0.01, steps=3.278e+07
2023-07-07 02:03:40,143 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 2100, best=0.52, avg=0.50, std=0.01, steps=3.442e+07
2023-07-07 02:03:55,079 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 2200, best=0.51, avg=0.50, std=0.00, steps=3.606e+07
2023-07-07 02:04:09,966 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 2300, best=0.52, avg=0.50, std=0.01, steps=3.770e+07
2023-07-07 02:04:24,838 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 2400, best=0.51, avg=0.50, std=0.01, steps=3.934e+07
2023-07-07 02:04:39,718 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 2500, best=0.51, avg=0.50, std=0.01, steps=4.098e+07
2023-07-07 02:04:54,594 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 2600, best=0.51, avg=0.50, std=0.01, steps=4.261e+07
2023-07-07 02:05:09,563 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 2700, best=0.51, avg=0.50, std=0.01, steps=4.425e+07
2023-07-07 02:05:24,547 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 2800, best=0.52, avg=0.50, std=0.01, steps=4.589e+07
2023-07-07 02:05:39,486 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 2900, best=0.52, avg=0.50, std=0.01, steps=4.753e+07
2023-07-07 02:05:54,327 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 3000, best=0.51, avg=0.50, std=0.01, steps=4.917e+07
2023-07-07 02:06:09,207 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 3100, best=0.51, avg=0.50, std=0.01, steps=5.081e+07
2023-07-07 02:06:24,065 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 3200, best=0.51, avg=0.50, std=0.01, steps=5.245e+07
2023-07-07 02:06:38,924 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 3300, best=0.51, avg=0.50, std=0.01, steps=5.408e+07
2023-07-07 02:06:53,777 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 3400, best=0.51, avg=0.50, std=0.01, steps=5.572e+07
2023-07-07 02:07:08,624 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 3500, best=0.51, avg=0.50, std=0.01, steps=5.736e+07
2023-07-07 02:07:23,504 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 3600, best=0.52, avg=0.50, std=0.01, steps=5.900e+07
2023-07-07 02:07:38,349 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 3700, best=0.51, avg=0.50, std=0.01, steps=6.064e+07
2023-07-07 02:07:53,239 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 3800, best=0.51, avg=0.50, std=0.01, steps=6.228e+07
2023-07-07 02:08:08,105 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 3900, best=0.51, avg=0.50, std=0.01, steps=6.391e+07
2023-07-07 02:08:22,964 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 4000, best=0.52, avg=0.50, std=0.01, steps=6.555e+07
2023-07-07 02:08:37,808 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 4100, best=0.52, avg=0.50, std=0.01, steps=6.719e+07
2023-07-07 02:08:52,702 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 4200, best=0.51, avg=0.50, std=0.00, steps=6.883e+07
2023-07-07 02:09:07,571 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 4300, best=0.51, avg=0.50, std=0.01, steps=7.047e+07
2023-07-07 02:09:22,452 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 4400, best=0.52, avg=0.50, std=0.01, steps=7.211e+07
2023-07-07 02:09:37,352 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 4500, best=0.51, avg=0.50, std=0.01, steps=7.374e+07
2023-07-07 02:09:52,194 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 4600, best=0.52, avg=0.50, std=0.01, steps=7.538e+07
2023-07-07 02:10:07,014 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 4700, best=0.52, avg=0.50, std=0.01, steps=7.702e+07
2023-07-07 02:10:21,847 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 4800, best=0.51, avg=0.50, std=0.01, steps=7.866e+07
2023-07-07 02:10:36,683 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 4900, best=0.51, avg=0.50, std=0.01, steps=8.030e+07
2023-07-07 02:10:51,554 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 5000, best=0.51, avg=0.50, std=0.01, steps=8.194e+07
2023-07-07 02:11:06,452 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 5100, best=0.51, avg=0.50, std=0.01, steps=8.357e+07
2023-07-07 02:11:21,328 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 5200, best=0.52, avg=0.50, std=0.01, steps=8.521e+07
2023-07-07 02:11:36,203 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 5300, best=0.52, avg=0.50, std=0.01, steps=8.685e+07
2023-07-07 02:11:51,071 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 5400, best=0.51, avg=0.50, std=0.01, steps=8.849e+07
2023-07-07 02:12:05,968 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 5500, best=0.52, avg=0.50, std=0.01, steps=9.013e+07
2023-07-07 02:12:20,846 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 5600, best=0.51, avg=0.50, std=0.01, steps=9.177e+07
2023-07-07 02:12:35,746 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 5700, best=0.51, avg=0.50, std=0.01, steps=9.341e+07
2023-07-07 02:12:50,611 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 5800, best=0.51, avg=0.50, std=0.01, steps=9.504e+07
2023-07-07 02:13:05,436 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 5900, best=0.51, avg=0.50, std=0.01, steps=9.668e+07
2023-07-07 02:13:20,309 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 6000, best=0.51, avg=0.50, std=0.01, steps=9.832e+07
2023-07-07 02:13:35,248 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 6100, best=0.51, avg=0.50, std=0.01, steps=9.996e+07
2023-07-07 02:13:50,204 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 6200, best=0.52, avg=0.50, std=0.01, steps=1.016e+08
2023-07-07 02:14:05,159 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 6300, best=0.52, avg=0.50, std=0.01, steps=1.032e+08
2023-07-07 02:14:20,052 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 6400, best=0.51, avg=0.50, std=0.00, steps=1.049e+08
2023-07-07 02:14:34,948 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 6500, best=0.51, avg=0.50, std=0.01, steps=1.065e+08
2023-07-07 02:14:49,821 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 6600, best=0.51, avg=0.50, std=0.01, steps=1.082e+08
2023-07-07 02:15:04,683 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 6700, best=0.52, avg=0.50, std=0.01, steps=1.098e+08
2023-07-07 02:15:19,532 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 6800, best=0.51, avg=0.50, std=0.01, steps=1.114e+08
2023-07-07 02:15:34,449 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 6900, best=0.51, avg=0.50, std=0.01, steps=1.131e+08
2023-07-07 02:15:49,322 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 7000, best=0.51, avg=0.50, std=0.01, steps=1.147e+08
2023-07-07 02:16:04,311 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 7100, best=0.52, avg=0.50, std=0.01, steps=1.163e+08
2023-07-07 02:16:19,194 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 7200, best=0.52, avg=0.50, std=0.01, steps=1.180e+08
2023-07-07 02:16:34,103 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 7300, best=0.52, avg=0.50, std=0.01, steps=1.196e+08
2023-07-07 02:16:48,948 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 7400, best=0.51, avg=0.50, std=0.01, steps=1.213e+08
2023-07-07 02:17:03,805 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 7500, best=0.51, avg=0.50, std=0.01, steps=1.229e+08
2023-07-07 02:17:18,643 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 7600, best=0.52, avg=0.50, std=0.01, steps=1.245e+08
2023-07-07 02:17:33,486 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 7700, best=0.51, avg=0.50, std=0.01, steps=1.262e+08
2023-07-07 02:17:48,365 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 7800, best=0.51, avg=0.50, std=0.01, steps=1.278e+08
2023-07-07 02:18:03,282 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 7900, best=0.52, avg=0.50, std=0.01, steps=1.294e+08
2023-07-07 02:18:18,289 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 8000, best=0.51, avg=0.50, std=0.01, steps=1.311e+08
2023-07-07 02:18:33,270 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 8100, best=0.52, avg=0.50, std=0.01, steps=1.327e+08
2023-07-07 02:18:48,205 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 8200, best=0.51, avg=0.50, std=0.01, steps=1.344e+08
2023-07-07 02:19:03,161 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 8300, best=0.51, avg=0.50, std=0.01, steps=1.360e+08
2023-07-07 02:19:18,130 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 8400, best=0.51, avg=0.50, std=0.01, steps=1.376e+08
2023-07-07 02:19:33,015 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 8500, best=0.51, avg=0.50, std=0.01, steps=1.393e+08
2023-07-07 02:19:47,891 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 8600, best=0.52, avg=0.50, std=0.01, steps=1.409e+08
2023-07-07 02:20:02,775 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 8700, best=0.51, avg=0.50, std=0.01, steps=1.426e+08
2023-07-07 02:20:17,675 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 8800, best=0.51, avg=0.50, std=0.01, steps=1.442e+08
2023-07-07 02:20:32,771 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 8900, best=0.52, avg=0.50, std=0.01, steps=1.458e+08
2023-07-07 02:20:47,699 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 9000, best=0.51, avg=0.50, std=0.01, steps=1.475e+08
2023-07-07 02:21:02,567 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 9100, best=0.51, avg=0.50, std=0.01, steps=1.491e+08
2023-07-07 02:21:17,468 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 9200, best=0.51, avg=0.50, std=0.01, steps=1.507e+08
2023-07-07 02:21:32,358 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 9300, best=0.52, avg=0.50, std=0.01, steps=1.524e+08
2023-07-07 02:21:47,192 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 9400, best=0.51, avg=0.50, std=0.01, steps=1.540e+08
2023-07-07 02:22:02,034 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 9500, best=0.51, avg=0.50, std=0.01, steps=1.557e+08
2023-07-07 02:22:16,940 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 9600, best=0.52, avg=0.50, std=0.00, steps=1.573e+08
2023-07-07 02:22:31,900 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 9700, best=0.51, avg=0.50, std=0.01, steps=1.589e+08
2023-07-07 02:22:46,834 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 9800, best=0.52, avg=0.50, std=0.01, steps=1.606e+08
2023-07-07 02:23:01,679 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 9900, best=0.51, avg=0.50, std=0.01, steps=1.622e+08
2023-07-07 02:23:16,535 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 10000, best=0.51, avg=0.50, std=0.01, steps=1.639e+08
2023-07-07 02:23:31,380 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 10100, best=0.51, avg=0.50, std=0.01, steps=1.655e+08
2023-07-07 02:23:46,205 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 10200, best=0.52, avg=0.50, std=0.01, steps=1.671e+08
2023-07-07 02:24:01,141 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 10300, best=0.52, avg=0.50, std=0.01, steps=1.688e+08
2023-07-07 02:24:16,014 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 10400, best=0.51, avg=0.50, std=0.01, steps=1.704e+08
2023-07-07 02:24:30,859 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 10500, best=0.52, avg=0.50, std=0.01, steps=1.720e+08
2023-07-07 02:24:45,722 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 10600, best=0.51, avg=0.50, std=0.01, steps=1.737e+08
2023-07-07 02:25:00,678 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 10700, best=0.51, avg=0.50, std=0.01, steps=1.753e+08
2023-07-07 02:25:15,661 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 10800, best=0.52, avg=0.50, std=0.01, steps=1.770e+08
2023-07-07 02:25:30,511 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 10900, best=0.52, avg=0.50, std=0.01, steps=1.786e+08
2023-07-07 02:25:45,356 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 11000, best=0.51, avg=0.50, std=0.01, steps=1.802e+08
2023-07-07 02:26:00,239 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 11100, best=0.52, avg=0.50, std=0.01, steps=1.819e+08
2023-07-07 02:26:15,132 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 11200, best=0.51, avg=0.50, std=0.01, steps=1.835e+08
2023-07-07 02:26:30,007 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 11300, best=0.51, avg=0.50, std=0.00, steps=1.852e+08
2023-07-07 02:26:44,874 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 11400, best=0.51, avg=0.50, std=0.01, steps=1.868e+08
2023-07-07 02:26:59,755 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 11500, best=0.51, avg=0.50, std=0.01, steps=1.884e+08
2023-07-07 02:27:14,628 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 11600, best=0.51, avg=0.50, std=0.01, steps=1.901e+08
2023-07-07 02:27:29,529 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 11700, best=0.51, avg=0.50, std=0.01, steps=1.917e+08
2023-07-07 02:27:44,397 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 11800, best=0.52, avg=0.50, std=0.01, steps=1.933e+08
2023-07-07 02:27:59,269 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 11900, best=0.51, avg=0.50, std=0.01, steps=1.950e+08
2023-07-07 02:28:14,008 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 0, [Train]: 11999, best=0.51, avg=0.50, std=0.01, steps=1.966e+08
2023-07-07 02:28:14,008 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 02:28:14,032 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 02:28:14,062 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 02:28:31,090 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 100, best=0.51, avg=0.50, std=0.00, steps=1.655e+06
2023-07-07 02:28:45,985 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 200, best=0.62, avg=0.61, std=0.00, steps=3.293e+06
2023-07-07 02:29:00,894 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 300, best=0.65, avg=0.64, std=0.00, steps=4.932e+06
2023-07-07 02:29:15,766 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 400, best=0.67, avg=0.66, std=0.00, steps=6.570e+06
2023-07-07 02:29:30,665 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 500, best=0.68, avg=0.67, std=0.00, steps=8.208e+06
2023-07-07 02:29:45,557 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 600, best=0.69, avg=0.68, std=0.00, steps=9.847e+06
2023-07-07 02:30:00,456 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 700, best=0.69, avg=0.69, std=0.00, steps=1.149e+07
2023-07-07 02:30:15,343 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 800, best=0.70, avg=0.69, std=0.00, steps=1.312e+07
2023-07-07 02:30:30,211 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 900, best=0.71, avg=0.70, std=0.00, steps=1.476e+07
2023-07-07 02:30:45,072 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 1000, best=0.71, avg=0.70, std=0.00, steps=1.640e+07
2023-07-07 02:30:59,918 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 1100, best=0.71, avg=0.71, std=0.00, steps=1.804e+07
2023-07-07 02:31:14,764 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 1200, best=0.71, avg=0.71, std=0.00, steps=1.968e+07
2023-07-07 02:31:29,617 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 1300, best=0.72, avg=0.71, std=0.00, steps=2.132e+07
2023-07-07 02:31:44,540 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 1400, best=0.72, avg=0.71, std=0.00, steps=2.295e+07
2023-07-07 02:31:59,417 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 1500, best=0.72, avg=0.72, std=0.00, steps=2.459e+07
2023-07-07 02:32:14,268 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 1600, best=0.73, avg=0.72, std=0.00, steps=2.623e+07
2023-07-07 02:32:29,193 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 1700, best=0.73, avg=0.72, std=0.00, steps=2.787e+07
2023-07-07 02:32:44,072 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 1800, best=0.73, avg=0.72, std=0.00, steps=2.951e+07
2023-07-07 02:32:58,915 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 1900, best=0.73, avg=0.72, std=0.00, steps=3.115e+07
2023-07-07 02:33:13,751 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 2000, best=0.73, avg=0.73, std=0.00, steps=3.278e+07
2023-07-07 02:33:28,590 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 2100, best=0.73, avg=0.73, std=0.00, steps=3.442e+07
2023-07-07 02:33:43,481 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 2200, best=0.73, avg=0.73, std=0.00, steps=3.606e+07
2023-07-07 02:33:58,434 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 2300, best=0.74, avg=0.73, std=0.00, steps=3.770e+07
2023-07-07 02:34:13,297 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 2400, best=0.74, avg=0.73, std=0.00, steps=3.934e+07
2023-07-07 02:34:28,172 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 2500, best=0.74, avg=0.73, std=0.00, steps=4.098e+07
2023-07-07 02:34:43,054 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 2600, best=0.74, avg=0.73, std=0.00, steps=4.261e+07
2023-07-07 02:34:57,935 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 2700, best=0.74, avg=0.74, std=0.00, steps=4.425e+07
2023-07-07 02:35:12,845 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 2800, best=0.75, avg=0.74, std=0.00, steps=4.589e+07
2023-07-07 02:35:27,762 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 2900, best=0.75, avg=0.74, std=0.00, steps=4.753e+07
2023-07-07 02:35:42,739 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 3000, best=0.75, avg=0.74, std=0.00, steps=4.917e+07
2023-07-07 02:35:57,718 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 3100, best=0.75, avg=0.74, std=0.00, steps=5.081e+07
2023-07-07 02:36:12,599 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 3200, best=0.75, avg=0.74, std=0.00, steps=5.245e+07
2023-07-07 02:36:27,504 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 3300, best=0.75, avg=0.74, std=0.00, steps=5.408e+07
2023-07-07 02:36:42,395 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 3400, best=0.75, avg=0.75, std=0.00, steps=5.572e+07
2023-07-07 02:36:57,259 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 3500, best=0.75, avg=0.75, std=0.00, steps=5.736e+07
2023-07-07 02:37:12,133 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 3600, best=0.76, avg=0.75, std=0.00, steps=5.900e+07
2023-07-07 02:37:27,033 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 3700, best=0.76, avg=0.75, std=0.00, steps=6.064e+07
2023-07-07 02:37:41,991 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 3800, best=0.76, avg=0.75, std=0.00, steps=6.228e+07
2023-07-07 02:37:56,854 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 3900, best=0.76, avg=0.75, std=0.00, steps=6.391e+07
2023-07-07 02:38:11,767 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 4000, best=0.76, avg=0.75, std=0.00, steps=6.555e+07
2023-07-07 02:38:26,641 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 4100, best=0.76, avg=0.75, std=0.00, steps=6.719e+07
2023-07-07 02:38:41,515 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 4200, best=0.76, avg=0.75, std=0.00, steps=6.883e+07
2023-07-07 02:38:56,395 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 4300, best=0.77, avg=0.75, std=0.00, steps=7.047e+07
2023-07-07 02:39:11,321 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 4400, best=0.77, avg=0.76, std=0.00, steps=7.211e+07
2023-07-07 02:39:26,245 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 4500, best=0.77, avg=0.76, std=0.00, steps=7.374e+07
2023-07-07 02:39:41,265 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 4600, best=0.77, avg=0.76, std=0.00, steps=7.538e+07
2023-07-07 02:39:56,410 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 4700, best=0.77, avg=0.76, std=0.00, steps=7.702e+07
2023-07-07 02:40:11,371 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 4800, best=0.77, avg=0.76, std=0.00, steps=7.866e+07
2023-07-07 02:40:26,366 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 4900, best=0.77, avg=0.76, std=0.00, steps=8.030e+07
2023-07-07 02:40:41,246 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 5000, best=0.77, avg=0.76, std=0.00, steps=8.194e+07
2023-07-07 02:40:56,139 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 5100, best=0.78, avg=0.77, std=0.00, steps=8.357e+07
2023-07-07 02:41:11,070 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 5200, best=0.77, avg=0.77, std=0.00, steps=8.521e+07
2023-07-07 02:41:25,965 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 5300, best=0.78, avg=0.77, std=0.00, steps=8.685e+07
2023-07-07 02:41:40,844 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 5400, best=0.78, avg=0.77, std=0.00, steps=8.849e+07
2023-07-07 02:41:55,807 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 5500, best=0.78, avg=0.77, std=0.00, steps=9.013e+07
2023-07-07 02:42:10,716 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 5600, best=0.78, avg=0.77, std=0.00, steps=9.177e+07
2023-07-07 02:42:25,706 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 5700, best=0.78, avg=0.77, std=0.00, steps=9.341e+07
2023-07-07 02:42:40,676 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 5800, best=0.78, avg=0.77, std=0.00, steps=9.504e+07
2023-07-07 02:42:55,605 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 5900, best=0.78, avg=0.77, std=0.00, steps=9.668e+07
2023-07-07 02:43:10,510 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 6000, best=0.78, avg=0.78, std=0.00, steps=9.832e+07
2023-07-07 02:43:25,383 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 6100, best=0.78, avg=0.78, std=0.00, steps=9.996e+07
2023-07-07 02:43:40,197 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 6200, best=0.79, avg=0.78, std=0.00, steps=1.016e+08
2023-07-07 02:43:55,038 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 6300, best=0.79, avg=0.78, std=0.00, steps=1.032e+08
2023-07-07 02:44:09,870 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 6400, best=0.78, avg=0.78, std=0.00, steps=1.049e+08
2023-07-07 02:44:24,702 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 6500, best=0.78, avg=0.78, std=0.00, steps=1.065e+08
2023-07-07 02:44:39,534 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 6600, best=0.79, avg=0.78, std=0.00, steps=1.082e+08
2023-07-07 02:44:54,370 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 6700, best=0.79, avg=0.78, std=0.00, steps=1.098e+08
2023-07-07 02:45:09,349 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 6800, best=0.79, avg=0.78, std=0.00, steps=1.114e+08
2023-07-07 02:45:24,259 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 6900, best=0.79, avg=0.78, std=0.00, steps=1.131e+08
2023-07-07 02:45:39,152 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 7000, best=0.79, avg=0.78, std=0.00, steps=1.147e+08
2023-07-07 02:45:54,039 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 7100, best=0.79, avg=0.78, std=0.00, steps=1.163e+08
2023-07-07 02:46:08,947 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 7200, best=0.79, avg=0.78, std=0.00, steps=1.180e+08
2023-07-07 02:46:23,853 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 7300, best=0.79, avg=0.78, std=0.00, steps=1.196e+08
2023-07-07 02:46:38,823 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 7400, best=0.79, avg=0.79, std=0.00, steps=1.213e+08
2023-07-07 02:46:53,732 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 7500, best=0.79, avg=0.79, std=0.00, steps=1.229e+08
2023-07-07 02:47:08,730 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 7600, best=0.79, avg=0.79, std=0.00, steps=1.245e+08
2023-07-07 02:47:23,641 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 7700, best=0.79, avg=0.79, std=0.00, steps=1.262e+08
2023-07-07 02:47:38,546 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 7800, best=0.80, avg=0.79, std=0.00, steps=1.278e+08
2023-07-07 02:47:53,437 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 7900, best=0.80, avg=0.79, std=0.00, steps=1.294e+08
2023-07-07 02:48:08,305 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 8000, best=0.80, avg=0.79, std=0.00, steps=1.311e+08
2023-07-07 02:48:23,153 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 8100, best=0.80, avg=0.79, std=0.00, steps=1.327e+08
2023-07-07 02:48:38,147 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 8200, best=0.80, avg=0.79, std=0.00, steps=1.344e+08
2023-07-07 02:48:53,039 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 8300, best=0.80, avg=0.79, std=0.00, steps=1.360e+08
2023-07-07 02:49:07,923 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 8400, best=0.80, avg=0.79, std=0.00, steps=1.376e+08
2023-07-07 02:49:22,809 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 8500, best=0.80, avg=0.79, std=0.00, steps=1.393e+08
2023-07-07 02:49:37,699 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 8600, best=0.80, avg=0.79, std=0.00, steps=1.409e+08
2023-07-07 02:49:52,552 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 8700, best=0.80, avg=0.79, std=0.00, steps=1.426e+08
2023-07-07 02:50:07,404 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 8800, best=0.80, avg=0.79, std=0.00, steps=1.442e+08
2023-07-07 02:50:22,278 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 8900, best=0.80, avg=0.79, std=0.00, steps=1.458e+08
2023-07-07 02:50:37,132 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 9000, best=0.80, avg=0.79, std=0.00, steps=1.475e+08
2023-07-07 02:50:51,991 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 9100, best=0.80, avg=0.79, std=0.00, steps=1.491e+08
2023-07-07 02:51:06,872 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 9200, best=0.80, avg=0.79, std=0.00, steps=1.507e+08
2023-07-07 02:51:21,760 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 9300, best=0.80, avg=0.80, std=0.00, steps=1.524e+08
2023-07-07 02:51:36,625 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 9400, best=0.80, avg=0.80, std=0.00, steps=1.540e+08
2023-07-07 02:51:51,457 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 9500, best=0.80, avg=0.80, std=0.00, steps=1.557e+08
2023-07-07 02:52:06,339 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 9600, best=0.80, avg=0.80, std=0.00, steps=1.573e+08
2023-07-07 02:52:21,170 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 9700, best=0.80, avg=0.80, std=0.00, steps=1.589e+08
2023-07-07 02:52:36,094 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 9800, best=0.80, avg=0.80, std=0.00, steps=1.606e+08
2023-07-07 02:52:50,956 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 9900, best=0.80, avg=0.80, std=0.00, steps=1.622e+08
2023-07-07 02:53:05,938 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 10000, best=0.80, avg=0.80, std=0.00, steps=1.639e+08
2023-07-07 02:53:20,885 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 10100, best=0.81, avg=0.80, std=0.00, steps=1.655e+08
2023-07-07 02:53:35,850 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 10200, best=0.81, avg=0.80, std=0.00, steps=1.671e+08
2023-07-07 02:53:50,723 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 10300, best=0.81, avg=0.80, std=0.00, steps=1.688e+08
2023-07-07 02:54:05,647 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 10400, best=0.81, avg=0.80, std=0.00, steps=1.704e+08
2023-07-07 02:54:20,527 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 10500, best=0.81, avg=0.80, std=0.00, steps=1.720e+08
2023-07-07 02:54:35,522 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 10600, best=0.81, avg=0.80, std=0.00, steps=1.737e+08
2023-07-07 02:54:50,407 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 10700, best=0.81, avg=0.80, std=0.00, steps=1.753e+08
2023-07-07 02:55:05,362 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 10800, best=0.81, avg=0.80, std=0.00, steps=1.770e+08
2023-07-07 02:55:20,236 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 10900, best=0.81, avg=0.80, std=0.00, steps=1.786e+08
2023-07-07 02:55:35,194 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 11000, best=0.81, avg=0.80, std=0.00, steps=1.802e+08
2023-07-07 02:55:50,084 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 11100, best=0.81, avg=0.80, std=0.00, steps=1.819e+08
2023-07-07 02:56:04,948 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 11200, best=0.81, avg=0.80, std=0.00, steps=1.835e+08
2023-07-07 02:56:19,811 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 11300, best=0.81, avg=0.80, std=0.00, steps=1.852e+08
2023-07-07 02:56:34,684 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 11400, best=0.81, avg=0.81, std=0.00, steps=1.868e+08
2023-07-07 02:56:49,565 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 11500, best=0.81, avg=0.80, std=0.00, steps=1.884e+08
2023-07-07 02:57:04,481 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 11600, best=0.81, avg=0.80, std=0.00, steps=1.901e+08
2023-07-07 02:57:19,391 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 11700, best=0.81, avg=0.81, std=0.00, steps=1.917e+08
2023-07-07 02:57:34,386 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 11800, best=0.81, avg=0.81, std=0.00, steps=1.933e+08
2023-07-07 02:57:49,406 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 11900, best=0.81, avg=0.81, std=0.00, steps=1.950e+08
2023-07-07 02:58:04,144 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 0, [Train]: 11999, best=0.81, avg=0.81, std=0.00, steps=1.966e+08
2023-07-07 02:58:04,145 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 02:58:04,168 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 02:58:04,200 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 02:58:23,156 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 100, best=0.52, avg=0.51, std=0.00, steps=1.862e+06
2023-07-07 02:58:39,943 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 200, best=0.60, avg=0.60, std=0.00, steps=3.705e+06
2023-07-07 02:58:56,681 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 300, best=0.62, avg=0.62, std=0.00, steps=5.548e+06
2023-07-07 02:59:13,327 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 400, best=0.64, avg=0.63, std=0.00, steps=7.391e+06
2023-07-07 02:59:29,998 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 500, best=0.65, avg=0.64, std=0.00, steps=9.234e+06
2023-07-07 02:59:46,660 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 600, best=0.66, avg=0.65, std=0.00, steps=1.108e+07
2023-07-07 03:00:03,443 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 700, best=0.67, avg=0.66, std=0.00, steps=1.292e+07
2023-07-07 03:00:20,219 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 800, best=0.67, avg=0.66, std=0.00, steps=1.476e+07
2023-07-07 03:00:37,098 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 900, best=0.68, avg=0.67, std=0.00, steps=1.661e+07
2023-07-07 03:00:53,829 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 1000, best=0.68, avg=0.67, std=0.00, steps=1.845e+07
2023-07-07 03:01:10,552 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 1100, best=0.68, avg=0.68, std=0.00, steps=2.029e+07
2023-07-07 03:01:27,233 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 1200, best=0.68, avg=0.68, std=0.00, steps=2.214e+07
2023-07-07 03:01:43,922 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 1300, best=0.69, avg=0.68, std=0.00, steps=2.398e+07
2023-07-07 03:02:00,703 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 1400, best=0.69, avg=0.68, std=0.00, steps=2.582e+07
2023-07-07 03:02:17,429 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 1500, best=0.69, avg=0.68, std=0.00, steps=2.767e+07
2023-07-07 03:02:34,128 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 1600, best=0.69, avg=0.69, std=0.00, steps=2.951e+07
2023-07-07 03:02:50,912 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 1700, best=0.69, avg=0.69, std=0.00, steps=3.135e+07
2023-07-07 03:03:07,711 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 1800, best=0.70, avg=0.69, std=0.00, steps=3.320e+07
2023-07-07 03:03:24,390 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 1900, best=0.70, avg=0.69, std=0.00, steps=3.504e+07
2023-07-07 03:03:41,054 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 2000, best=0.70, avg=0.69, std=0.00, steps=3.688e+07
2023-07-07 03:03:57,777 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 2100, best=0.70, avg=0.69, std=0.00, steps=3.873e+07
2023-07-07 03:04:14,495 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 2200, best=0.70, avg=0.69, std=0.00, steps=4.057e+07
2023-07-07 03:04:31,287 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 2300, best=0.71, avg=0.70, std=0.00, steps=4.241e+07
2023-07-07 03:04:48,044 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 2400, best=0.70, avg=0.70, std=0.00, steps=4.426e+07
2023-07-07 03:05:04,890 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 2500, best=0.71, avg=0.70, std=0.00, steps=4.610e+07
2023-07-07 03:05:21,596 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 2600, best=0.71, avg=0.70, std=0.00, steps=4.794e+07
2023-07-07 03:05:38,340 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 2700, best=0.71, avg=0.70, std=0.00, steps=4.978e+07
2023-07-07 03:05:55,047 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 2800, best=0.71, avg=0.70, std=0.00, steps=5.163e+07
2023-07-07 03:06:11,705 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 2900, best=0.71, avg=0.70, std=0.00, steps=5.347e+07
2023-07-07 03:06:28,445 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 3000, best=0.71, avg=0.70, std=0.00, steps=5.531e+07
2023-07-07 03:06:45,157 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 3100, best=0.71, avg=0.71, std=0.00, steps=5.716e+07
2023-07-07 03:07:01,951 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 3200, best=0.71, avg=0.71, std=0.00, steps=5.900e+07
2023-07-07 03:07:18,622 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 3300, best=0.71, avg=0.71, std=0.00, steps=6.084e+07
2023-07-07 03:07:35,284 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 3400, best=0.72, avg=0.71, std=0.00, steps=6.269e+07
2023-07-07 03:07:51,994 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 3500, best=0.72, avg=0.71, std=0.00, steps=6.453e+07
2023-07-07 03:08:08,746 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 3600, best=0.72, avg=0.71, std=0.00, steps=6.637e+07
2023-07-07 03:08:25,391 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 3700, best=0.72, avg=0.71, std=0.00, steps=6.822e+07
2023-07-07 03:08:42,058 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 3800, best=0.72, avg=0.71, std=0.00, steps=7.006e+07
2023-07-07 03:08:58,764 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 3900, best=0.72, avg=0.71, std=0.00, steps=7.190e+07
2023-07-07 03:09:15,484 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 4000, best=0.72, avg=0.71, std=0.00, steps=7.375e+07
2023-07-07 03:09:32,170 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 4100, best=0.72, avg=0.71, std=0.00, steps=7.559e+07
2023-07-07 03:09:48,826 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 4200, best=0.72, avg=0.71, std=0.00, steps=7.743e+07
2023-07-07 03:10:05,521 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 4300, best=0.72, avg=0.72, std=0.00, steps=7.928e+07
2023-07-07 03:10:22,232 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 4400, best=0.72, avg=0.72, std=0.00, steps=8.112e+07
2023-07-07 03:10:38,910 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 4500, best=0.72, avg=0.72, std=0.00, steps=8.296e+07
2023-07-07 03:10:55,608 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 4600, best=0.72, avg=0.72, std=0.00, steps=8.481e+07
2023-07-07 03:11:12,310 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 4700, best=0.72, avg=0.72, std=0.00, steps=8.665e+07
2023-07-07 03:11:28,984 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 4800, best=0.72, avg=0.72, std=0.00, steps=8.849e+07
2023-07-07 03:11:45,634 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 4900, best=0.73, avg=0.72, std=0.00, steps=9.034e+07
2023-07-07 03:12:02,300 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 5000, best=0.73, avg=0.72, std=0.00, steps=9.218e+07
2023-07-07 03:12:19,009 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 5100, best=0.73, avg=0.72, std=0.00, steps=9.402e+07
2023-07-07 03:12:35,713 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 5200, best=0.73, avg=0.72, std=0.00, steps=9.586e+07
2023-07-07 03:12:52,478 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 5300, best=0.73, avg=0.72, std=0.00, steps=9.771e+07
2023-07-07 03:13:09,221 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 5400, best=0.73, avg=0.72, std=0.00, steps=9.955e+07
2023-07-07 03:13:25,943 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 5500, best=0.73, avg=0.72, std=0.00, steps=1.014e+08
2023-07-07 03:13:42,742 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 5600, best=0.73, avg=0.72, std=0.00, steps=1.032e+08
2023-07-07 03:13:59,482 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 5700, best=0.73, avg=0.72, std=0.00, steps=1.051e+08
2023-07-07 03:14:16,109 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 5800, best=0.73, avg=0.72, std=0.00, steps=1.069e+08
2023-07-07 03:14:32,833 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 5900, best=0.73, avg=0.72, std=0.00, steps=1.088e+08
2023-07-07 03:14:49,529 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 6000, best=0.73, avg=0.72, std=0.00, steps=1.106e+08
2023-07-07 03:15:06,312 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 6100, best=0.73, avg=0.72, std=0.00, steps=1.125e+08
2023-07-07 03:15:23,145 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 6200, best=0.74, avg=0.73, std=0.00, steps=1.143e+08
2023-07-07 03:15:39,882 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 6300, best=0.73, avg=0.73, std=0.00, steps=1.161e+08
2023-07-07 03:15:56,624 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 6400, best=0.73, avg=0.73, std=0.00, steps=1.180e+08
2023-07-07 03:16:13,380 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 6500, best=0.73, avg=0.73, std=0.00, steps=1.198e+08
2023-07-07 03:16:30,214 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 6600, best=0.73, avg=0.73, std=0.00, steps=1.217e+08
2023-07-07 03:16:46,998 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 6700, best=0.73, avg=0.73, std=0.00, steps=1.235e+08
2023-07-07 03:17:03,761 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 6800, best=0.74, avg=0.73, std=0.00, steps=1.254e+08
2023-07-07 03:17:20,449 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 6900, best=0.74, avg=0.73, std=0.00, steps=1.272e+08
2023-07-07 03:17:37,206 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 7000, best=0.74, avg=0.73, std=0.00, steps=1.290e+08
2023-07-07 03:17:53,981 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 7100, best=0.74, avg=0.73, std=0.00, steps=1.309e+08
2023-07-07 03:18:10,653 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 7200, best=0.74, avg=0.73, std=0.00, steps=1.327e+08
2023-07-07 03:18:27,297 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 7300, best=0.74, avg=0.73, std=0.00, steps=1.346e+08
2023-07-07 03:18:44,005 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 7400, best=0.74, avg=0.73, std=0.00, steps=1.364e+08
2023-07-07 03:19:00,788 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 7500, best=0.74, avg=0.73, std=0.00, steps=1.383e+08
2023-07-07 03:19:17,467 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 7600, best=0.74, avg=0.73, std=0.00, steps=1.401e+08
2023-07-07 03:19:34,220 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 7700, best=0.74, avg=0.73, std=0.00, steps=1.419e+08
2023-07-07 03:19:50,925 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 7800, best=0.74, avg=0.73, std=0.00, steps=1.438e+08
2023-07-07 03:20:07,622 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 7900, best=0.74, avg=0.73, std=0.00, steps=1.456e+08
2023-07-07 03:20:24,318 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 8000, best=0.74, avg=0.73, std=0.00, steps=1.475e+08
2023-07-07 03:20:41,024 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 8100, best=0.74, avg=0.73, std=0.00, steps=1.493e+08
2023-07-07 03:20:57,742 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 8200, best=0.74, avg=0.73, std=0.00, steps=1.512e+08
2023-07-07 03:21:14,428 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 8300, best=0.74, avg=0.73, std=0.00, steps=1.530e+08
2023-07-07 03:21:31,112 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 8400, best=0.74, avg=0.73, std=0.00, steps=1.548e+08
2023-07-07 03:21:47,882 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 8500, best=0.74, avg=0.74, std=0.00, steps=1.567e+08
2023-07-07 03:22:04,682 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 8600, best=0.74, avg=0.74, std=0.00, steps=1.585e+08
2023-07-07 03:22:21,461 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 8700, best=0.74, avg=0.74, std=0.00, steps=1.604e+08
2023-07-07 03:22:38,130 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 8800, best=0.74, avg=0.74, std=0.00, steps=1.622e+08
2023-07-07 03:22:54,824 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 8900, best=0.75, avg=0.74, std=0.00, steps=1.641e+08
2023-07-07 03:23:11,524 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 9000, best=0.74, avg=0.74, std=0.00, steps=1.659e+08
2023-07-07 03:23:28,296 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 9100, best=0.74, avg=0.74, std=0.00, steps=1.677e+08
2023-07-07 03:23:45,094 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 9200, best=0.75, avg=0.74, std=0.00, steps=1.696e+08
2023-07-07 03:24:01,829 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 9300, best=0.75, avg=0.74, std=0.00, steps=1.714e+08
2023-07-07 03:24:18,588 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 9400, best=0.75, avg=0.74, std=0.00, steps=1.733e+08
2023-07-07 03:24:35,469 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 9500, best=0.74, avg=0.74, std=0.00, steps=1.751e+08
2023-07-07 03:24:52,199 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 9600, best=0.75, avg=0.74, std=0.00, steps=1.770e+08
2023-07-07 03:25:08,963 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 9700, best=0.75, avg=0.74, std=0.00, steps=1.788e+08
2023-07-07 03:25:25,647 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 9800, best=0.75, avg=0.74, std=0.00, steps=1.807e+08
2023-07-07 03:25:42,423 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 9900, best=0.75, avg=0.74, std=0.00, steps=1.825e+08
2023-07-07 03:25:59,216 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 10000, best=0.75, avg=0.74, std=0.00, steps=1.843e+08
2023-07-07 03:26:15,920 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 10100, best=0.75, avg=0.74, std=0.00, steps=1.862e+08
2023-07-07 03:26:32,680 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 10200, best=0.75, avg=0.74, std=0.00, steps=1.880e+08
2023-07-07 03:26:49,378 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 10300, best=0.75, avg=0.74, std=0.00, steps=1.899e+08
2023-07-07 03:27:06,164 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 10400, best=0.75, avg=0.74, std=0.00, steps=1.917e+08
2023-07-07 03:27:22,940 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 10500, best=0.75, avg=0.74, std=0.00, steps=1.936e+08
2023-07-07 03:27:39,736 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 10600, best=0.75, avg=0.74, std=0.00, steps=1.954e+08
2023-07-07 03:27:56,511 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 10700, best=0.75, avg=0.74, std=0.00, steps=1.972e+08
2023-07-07 03:28:13,347 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 10800, best=0.75, avg=0.74, std=0.00, steps=1.991e+08
2023-07-07 03:28:30,066 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 10900, best=0.75, avg=0.74, std=0.00, steps=2.009e+08
2023-07-07 03:28:46,834 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 11000, best=0.75, avg=0.74, std=0.00, steps=2.028e+08
2023-07-07 03:29:03,643 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 11100, best=0.75, avg=0.74, std=0.00, steps=2.046e+08
2023-07-07 03:29:20,387 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 11200, best=0.75, avg=0.74, std=0.00, steps=2.065e+08
2023-07-07 03:29:37,171 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 11300, best=0.75, avg=0.74, std=0.00, steps=2.083e+08
2023-07-07 03:29:53,829 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 11400, best=0.75, avg=0.75, std=0.00, steps=2.101e+08
2023-07-07 03:30:10,475 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 11500, best=0.75, avg=0.75, std=0.00, steps=2.120e+08
2023-07-07 03:30:27,166 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 11600, best=0.75, avg=0.75, std=0.00, steps=2.138e+08
2023-07-07 03:30:43,814 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 11700, best=0.75, avg=0.75, std=0.00, steps=2.157e+08
2023-07-07 03:31:00,567 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 11800, best=0.76, avg=0.75, std=0.00, steps=2.175e+08
2023-07-07 03:31:17,279 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 11900, best=0.75, avg=0.75, std=0.00, steps=2.194e+08
2023-07-07 03:31:33,809 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 0, [Train]: 11999, best=0.75, avg=0.75, std=0.00, steps=2.212e+08
2023-07-07 03:31:33,810 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 03:31:33,834 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 03:31:33,864 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 03:31:54,501 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 100, best=0.51, avg=0.50, std=0.00, steps=2.068e+06
2023-07-07 03:32:13,076 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 200, best=0.51, avg=0.50, std=0.00, steps=4.116e+06
2023-07-07 03:32:31,746 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 300, best=0.51, avg=0.50, std=0.00, steps=6.164e+06
2023-07-07 03:32:50,483 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 400, best=0.51, avg=0.50, std=0.00, steps=8.212e+06
2023-07-07 03:33:08,994 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 500, best=0.51, avg=0.50, std=0.00, steps=1.026e+07
2023-07-07 03:33:27,558 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 600, best=0.51, avg=0.50, std=0.00, steps=1.231e+07
2023-07-07 03:33:46,008 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 700, best=0.51, avg=0.50, std=0.00, steps=1.436e+07
2023-07-07 03:34:04,526 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 800, best=0.51, avg=0.50, std=0.00, steps=1.640e+07
2023-07-07 03:34:23,082 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 900, best=0.51, avg=0.50, std=0.00, steps=1.845e+07
2023-07-07 03:34:41,864 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 1000, best=0.51, avg=0.50, std=0.00, steps=2.050e+07
2023-07-07 03:35:00,509 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 1100, best=0.51, avg=0.50, std=0.00, steps=2.255e+07
2023-07-07 03:35:19,137 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 1200, best=0.51, avg=0.50, std=0.00, steps=2.460e+07
2023-07-07 03:35:37,605 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 1300, best=0.51, avg=0.50, std=0.00, steps=2.664e+07
2023-07-07 03:35:56,100 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 1400, best=0.51, avg=0.50, std=0.00, steps=2.869e+07
2023-07-07 03:36:14,585 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 1500, best=0.51, avg=0.50, std=0.00, steps=3.074e+07
2023-07-07 03:36:33,072 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 1600, best=0.51, avg=0.50, std=0.00, steps=3.279e+07
2023-07-07 03:36:51,682 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 1700, best=0.51, avg=0.50, std=0.00, steps=3.484e+07
2023-07-07 03:37:10,284 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 1800, best=0.51, avg=0.50, std=0.00, steps=3.688e+07
2023-07-07 03:37:28,824 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 1900, best=0.51, avg=0.50, std=0.00, steps=3.893e+07
2023-07-07 03:37:47,327 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 2000, best=0.51, avg=0.50, std=0.00, steps=4.098e+07
2023-07-07 03:38:05,825 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 2100, best=0.51, avg=0.50, std=0.00, steps=4.303e+07
2023-07-07 03:38:24,320 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 2200, best=0.51, avg=0.50, std=0.00, steps=4.508e+07
2023-07-07 03:38:42,814 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 2300, best=0.51, avg=0.50, std=0.00, steps=4.712e+07
2023-07-07 03:39:01,303 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 2400, best=0.51, avg=0.50, std=0.00, steps=4.917e+07
2023-07-07 03:39:19,803 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 2500, best=0.51, avg=0.50, std=0.00, steps=5.122e+07
2023-07-07 03:39:38,292 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 2600, best=0.51, avg=0.50, std=0.00, steps=5.327e+07
2023-07-07 03:39:56,775 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 2700, best=0.51, avg=0.50, std=0.00, steps=5.532e+07
2023-07-07 03:40:15,252 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 2800, best=0.51, avg=0.50, std=0.00, steps=5.736e+07
2023-07-07 03:40:33,747 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 2900, best=0.51, avg=0.50, std=0.00, steps=5.941e+07
2023-07-07 03:40:52,305 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 3000, best=0.51, avg=0.50, std=0.00, steps=6.146e+07
2023-07-07 03:41:10,861 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 3100, best=0.51, avg=0.50, std=0.00, steps=6.351e+07
2023-07-07 03:41:29,400 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 3200, best=0.51, avg=0.50, std=0.00, steps=6.556e+07
2023-07-07 03:41:47,932 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 3300, best=0.51, avg=0.50, std=0.00, steps=6.760e+07
2023-07-07 03:42:06,521 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 3400, best=0.51, avg=0.50, std=0.00, steps=6.965e+07
2023-07-07 03:42:25,100 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 3500, best=0.51, avg=0.50, std=0.00, steps=7.170e+07
2023-07-07 03:42:43,651 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 3600, best=0.51, avg=0.50, std=0.00, steps=7.375e+07
2023-07-07 03:43:02,283 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 3700, best=0.51, avg=0.50, std=0.00, steps=7.580e+07
2023-07-07 03:43:20,896 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 3800, best=0.51, avg=0.50, std=0.00, steps=7.784e+07
2023-07-07 03:43:39,407 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 3900, best=0.51, avg=0.50, std=0.00, steps=7.989e+07
2023-07-07 03:43:57,885 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 4000, best=0.51, avg=0.50, std=0.00, steps=8.194e+07
2023-07-07 03:44:16,414 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 4100, best=0.51, avg=0.50, std=0.00, steps=8.399e+07
2023-07-07 03:44:34,949 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 4200, best=0.52, avg=0.50, std=0.00, steps=8.604e+07
2023-07-07 03:44:53,471 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 4300, best=0.51, avg=0.50, std=0.00, steps=8.808e+07
2023-07-07 03:45:11,998 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 4400, best=0.51, avg=0.50, std=0.00, steps=9.013e+07
2023-07-07 03:45:30,459 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 4500, best=0.51, avg=0.50, std=0.00, steps=9.218e+07
2023-07-07 03:45:48,932 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 4600, best=0.52, avg=0.50, std=0.00, steps=9.423e+07
2023-07-07 03:46:07,428 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 4700, best=0.51, avg=0.50, std=0.00, steps=9.628e+07
2023-07-07 03:46:25,909 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 4800, best=0.52, avg=0.50, std=0.00, steps=9.832e+07
2023-07-07 03:46:44,379 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 4900, best=0.51, avg=0.50, std=0.00, steps=1.004e+08
2023-07-07 03:47:02,932 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 5000, best=0.51, avg=0.50, std=0.00, steps=1.024e+08
2023-07-07 03:47:21,539 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 5100, best=0.51, avg=0.50, std=0.00, steps=1.045e+08
2023-07-07 03:47:40,059 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 5200, best=0.51, avg=0.50, std=0.00, steps=1.065e+08
2023-07-07 03:47:58,580 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 5300, best=0.51, avg=0.50, std=0.00, steps=1.086e+08
2023-07-07 03:48:17,139 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 5400, best=0.52, avg=0.50, std=0.00, steps=1.106e+08
2023-07-07 03:48:35,807 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 5500, best=0.51, avg=0.50, std=0.00, steps=1.127e+08
2023-07-07 03:48:54,295 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 5600, best=0.51, avg=0.50, std=0.00, steps=1.147e+08
2023-07-07 03:49:12,811 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 5700, best=0.51, avg=0.50, std=0.00, steps=1.168e+08
2023-07-07 03:49:31,422 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 5800, best=0.51, avg=0.50, std=0.00, steps=1.188e+08
2023-07-07 03:49:50,007 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 5900, best=0.51, avg=0.50, std=0.00, steps=1.209e+08
2023-07-07 03:50:08,596 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 6000, best=0.51, avg=0.50, std=0.00, steps=1.229e+08
2023-07-07 03:50:27,227 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 6100, best=0.51, avg=0.50, std=0.00, steps=1.249e+08
2023-07-07 03:50:45,747 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 6200, best=0.51, avg=0.50, std=0.00, steps=1.270e+08
2023-07-07 03:51:04,248 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 6300, best=0.51, avg=0.50, std=0.00, steps=1.290e+08
2023-07-07 03:51:22,770 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 6400, best=0.51, avg=0.50, std=0.00, steps=1.311e+08
2023-07-07 03:51:41,297 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 6500, best=0.51, avg=0.50, std=0.00, steps=1.331e+08
2023-07-07 03:51:59,802 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 6600, best=0.51, avg=0.50, std=0.00, steps=1.352e+08
2023-07-07 03:52:18,288 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 6700, best=0.51, avg=0.50, std=0.00, steps=1.372e+08
2023-07-07 03:52:36,777 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 6800, best=0.51, avg=0.50, std=0.00, steps=1.393e+08
2023-07-07 03:52:55,246 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 6900, best=0.51, avg=0.50, std=0.00, steps=1.413e+08
2023-07-07 03:53:13,840 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 7000, best=0.51, avg=0.50, std=0.00, steps=1.434e+08
2023-07-07 03:53:32,338 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 7100, best=0.51, avg=0.50, std=0.00, steps=1.454e+08
2023-07-07 03:53:50,801 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 7200, best=0.51, avg=0.50, std=0.00, steps=1.475e+08
2023-07-07 03:54:09,412 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 7300, best=0.51, avg=0.50, std=0.00, steps=1.495e+08
2023-07-07 03:54:27,933 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 7400, best=0.51, avg=0.50, std=0.00, steps=1.516e+08
2023-07-07 03:54:46,431 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 7500, best=0.51, avg=0.50, std=0.00, steps=1.536e+08
2023-07-07 03:55:04,988 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 7600, best=0.51, avg=0.50, std=0.00, steps=1.557e+08
2023-07-07 03:55:23,553 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 7700, best=0.51, avg=0.50, std=0.00, steps=1.577e+08
2023-07-07 03:55:42,174 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 7800, best=0.51, avg=0.50, std=0.00, steps=1.598e+08
2023-07-07 03:56:00,744 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 7900, best=0.51, avg=0.50, std=0.00, steps=1.618e+08
2023-07-07 03:56:19,354 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 8000, best=0.51, avg=0.50, std=0.00, steps=1.639e+08
2023-07-07 03:56:37,945 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 8100, best=0.51, avg=0.50, std=0.00, steps=1.659e+08
2023-07-07 03:56:56,471 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 8200, best=0.51, avg=0.50, std=0.00, steps=1.680e+08
2023-07-07 03:57:15,056 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 8300, best=0.51, avg=0.50, std=0.00, steps=1.700e+08
2023-07-07 03:57:33,627 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 8400, best=0.51, avg=0.50, std=0.00, steps=1.721e+08
2023-07-07 03:57:52,164 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 8500, best=0.51, avg=0.50, std=0.00, steps=1.741e+08
2023-07-07 03:58:10,684 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 8600, best=0.51, avg=0.50, std=0.00, steps=1.761e+08
2023-07-07 03:58:29,230 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 8700, best=0.51, avg=0.50, std=0.00, steps=1.782e+08
2023-07-07 03:58:47,733 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 8800, best=0.51, avg=0.50, std=0.00, steps=1.802e+08
2023-07-07 03:59:06,287 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 8900, best=0.51, avg=0.50, std=0.00, steps=1.823e+08
2023-07-07 03:59:24,847 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 9000, best=0.51, avg=0.50, std=0.00, steps=1.843e+08
2023-07-07 03:59:43,498 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 9100, best=0.51, avg=0.50, std=0.00, steps=1.864e+08
2023-07-07 04:00:02,027 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 9200, best=0.51, avg=0.50, std=0.00, steps=1.884e+08
2023-07-07 04:00:20,626 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 9300, best=0.51, avg=0.50, std=0.00, steps=1.905e+08
2023-07-07 04:00:39,172 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 9400, best=0.51, avg=0.50, std=0.00, steps=1.925e+08
2023-07-07 04:00:57,667 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 9500, best=0.51, avg=0.50, std=0.00, steps=1.946e+08
2023-07-07 04:01:16,267 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 9600, best=0.51, avg=0.50, std=0.00, steps=1.966e+08
2023-07-07 04:01:34,913 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 9700, best=0.51, avg=0.50, std=0.00, steps=1.987e+08
2023-07-07 04:01:53,427 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 9800, best=0.51, avg=0.50, std=0.00, steps=2.007e+08
2023-07-07 04:02:11,951 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 9900, best=0.51, avg=0.50, std=0.00, steps=2.028e+08
2023-07-07 04:02:30,515 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 10000, best=0.51, avg=0.50, std=0.00, steps=2.048e+08
2023-07-07 04:02:49,045 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 10100, best=0.51, avg=0.50, std=0.00, steps=2.069e+08
2023-07-07 04:03:07,604 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 10200, best=0.51, avg=0.50, std=0.00, steps=2.089e+08
2023-07-07 04:03:26,177 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 10300, best=0.51, avg=0.50, std=0.00, steps=2.110e+08
2023-07-07 04:03:44,675 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 10400, best=0.51, avg=0.50, std=0.00, steps=2.130e+08
2023-07-07 04:04:03,217 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 10500, best=0.51, avg=0.50, std=0.00, steps=2.151e+08
2023-07-07 04:04:21,711 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 10600, best=0.51, avg=0.50, std=0.00, steps=2.171e+08
2023-07-07 04:04:40,204 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 10700, best=0.51, avg=0.50, std=0.00, steps=2.192e+08
2023-07-07 04:04:58,736 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 10800, best=0.51, avg=0.50, std=0.00, steps=2.212e+08
2023-07-07 04:05:17,221 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 10900, best=0.51, avg=0.50, std=0.00, steps=2.233e+08
2023-07-07 04:05:35,749 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 11000, best=0.51, avg=0.50, std=0.00, steps=2.253e+08
2023-07-07 04:05:54,302 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 11100, best=0.51, avg=0.50, std=0.00, steps=2.273e+08
2023-07-07 04:06:12,948 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 11200, best=0.51, avg=0.50, std=0.00, steps=2.294e+08
2023-07-07 04:06:31,575 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 11300, best=0.51, avg=0.50, std=0.00, steps=2.314e+08
2023-07-07 04:06:50,135 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 11400, best=0.51, avg=0.50, std=0.00, steps=2.335e+08
2023-07-07 04:07:08,672 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 11500, best=0.51, avg=0.50, std=0.00, steps=2.355e+08
2023-07-07 04:07:27,312 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 11600, best=0.51, avg=0.50, std=0.00, steps=2.376e+08
2023-07-07 04:07:45,862 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 11700, best=0.51, avg=0.50, std=0.00, steps=2.396e+08
2023-07-07 04:08:04,379 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 11800, best=0.51, avg=0.50, std=0.00, steps=2.417e+08
2023-07-07 04:08:22,896 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 11900, best=0.51, avg=0.50, std=0.00, steps=2.437e+08
2023-07-07 04:08:41,442 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 0, [Train]: 11999, best=0.51, avg=0.50, std=0.00, steps=2.458e+08
2023-07-07 04:08:41,443 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 04:08:41,466 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 04:08:41,497 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 04:09:05,947 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 100, best=0.51, avg=0.50, std=0.00, steps=2.482e+06
2023-07-07 04:09:28,277 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 200, best=0.51, avg=0.50, std=0.00, steps=4.940e+06
2023-07-07 04:09:50,496 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 300, best=0.51, avg=0.50, std=0.00, steps=7.397e+06
2023-07-07 04:10:12,746 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 400, best=0.56, avg=0.56, std=0.00, steps=9.855e+06
2023-07-07 04:10:34,970 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 500, best=0.58, avg=0.57, std=0.00, steps=1.231e+07
2023-07-07 04:10:57,241 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 600, best=0.59, avg=0.58, std=0.00, steps=1.477e+07
2023-07-07 04:11:19,412 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 700, best=0.60, avg=0.59, std=0.00, steps=1.723e+07
2023-07-07 04:11:41,674 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 800, best=0.60, avg=0.59, std=0.00, steps=1.969e+07
2023-07-07 04:12:03,940 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 900, best=0.61, avg=0.60, std=0.00, steps=2.214e+07
2023-07-07 04:12:26,207 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 1000, best=0.62, avg=0.61, std=0.00, steps=2.460e+07
2023-07-07 04:12:48,438 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 1100, best=0.62, avg=0.61, std=0.00, steps=2.706e+07
2023-07-07 04:13:10,603 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 1200, best=0.62, avg=0.62, std=0.00, steps=2.952e+07
2023-07-07 04:13:32,802 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 1300, best=0.63, avg=0.62, std=0.00, steps=3.197e+07
2023-07-07 04:13:55,054 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 1400, best=0.63, avg=0.63, std=0.00, steps=3.443e+07
2023-07-07 04:14:17,439 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 1500, best=0.64, avg=0.63, std=0.00, steps=3.689e+07
2023-07-07 04:14:39,648 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 1600, best=0.64, avg=0.63, std=0.00, steps=3.935e+07
2023-07-07 04:15:01,843 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 1700, best=0.64, avg=0.63, std=0.00, steps=4.180e+07
2023-07-07 04:15:23,979 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 1800, best=0.64, avg=0.63, std=0.00, steps=4.426e+07
2023-07-07 04:15:46,194 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 1900, best=0.64, avg=0.64, std=0.00, steps=4.672e+07
2023-07-07 04:16:08,478 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 2000, best=0.64, avg=0.64, std=0.00, steps=4.918e+07
2023-07-07 04:16:30,798 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 2100, best=0.64, avg=0.64, std=0.00, steps=5.163e+07
2023-07-07 04:16:52,945 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 2200, best=0.65, avg=0.64, std=0.00, steps=5.409e+07
2023-07-07 04:17:15,228 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 2300, best=0.65, avg=0.64, std=0.00, steps=5.655e+07
2023-07-07 04:17:37,500 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 2400, best=0.65, avg=0.64, std=0.00, steps=5.901e+07
2023-07-07 04:17:59,712 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 2500, best=0.65, avg=0.64, std=0.00, steps=6.146e+07
2023-07-07 04:18:21,898 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 2600, best=0.65, avg=0.64, std=0.00, steps=6.392e+07
2023-07-07 04:18:44,222 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 2700, best=0.65, avg=0.64, std=0.00, steps=6.638e+07
2023-07-07 04:19:06,504 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 2800, best=0.65, avg=0.64, std=0.00, steps=6.884e+07
2023-07-07 04:19:28,722 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 2900, best=0.65, avg=0.64, std=0.00, steps=7.129e+07
2023-07-07 04:19:50,864 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 3000, best=0.65, avg=0.64, std=0.00, steps=7.375e+07
2023-07-07 04:20:13,087 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 3100, best=0.65, avg=0.64, std=0.00, steps=7.621e+07
2023-07-07 04:20:35,294 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 3200, best=0.65, avg=0.65, std=0.00, steps=7.867e+07
2023-07-07 04:20:57,506 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 3300, best=0.65, avg=0.65, std=0.00, steps=8.113e+07
2023-07-07 04:21:19,792 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 3400, best=0.65, avg=0.65, std=0.00, steps=8.358e+07
2023-07-07 04:21:42,048 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 3500, best=0.65, avg=0.65, std=0.00, steps=8.604e+07
2023-07-07 04:22:04,391 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 3600, best=0.65, avg=0.65, std=0.00, steps=8.850e+07
2023-07-07 04:22:26,598 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 3700, best=0.65, avg=0.65, std=0.00, steps=9.096e+07
2023-07-07 04:22:48,729 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 3800, best=0.65, avg=0.65, std=0.00, steps=9.341e+07
2023-07-07 04:23:10,928 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 3900, best=0.65, avg=0.65, std=0.00, steps=9.587e+07
2023-07-07 04:23:33,222 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 4000, best=0.66, avg=0.65, std=0.00, steps=9.833e+07
2023-07-07 04:23:55,453 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 4100, best=0.65, avg=0.65, std=0.00, steps=1.008e+08
2023-07-07 04:24:17,832 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 4200, best=0.66, avg=0.65, std=0.00, steps=1.032e+08
2023-07-07 04:24:39,980 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 4300, best=0.66, avg=0.65, std=0.00, steps=1.057e+08
2023-07-07 04:25:02,302 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 4400, best=0.66, avg=0.65, std=0.00, steps=1.082e+08
2023-07-07 04:25:24,420 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 4500, best=0.66, avg=0.65, std=0.00, steps=1.106e+08
2023-07-07 04:25:46,585 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 4600, best=0.66, avg=0.65, std=0.00, steps=1.131e+08
2023-07-07 04:26:08,895 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 4700, best=0.66, avg=0.65, std=0.00, steps=1.155e+08
2023-07-07 04:26:31,179 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 4800, best=0.66, avg=0.65, std=0.00, steps=1.180e+08
2023-07-07 04:26:53,349 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 4900, best=0.66, avg=0.65, std=0.00, steps=1.204e+08
2023-07-07 04:27:15,466 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 5000, best=0.66, avg=0.65, std=0.00, steps=1.229e+08
2023-07-07 04:27:37,629 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 5100, best=0.66, avg=0.65, std=0.00, steps=1.254e+08
2023-07-07 04:27:59,768 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 5200, best=0.66, avg=0.65, std=0.00, steps=1.278e+08
2023-07-07 04:28:22,003 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 5300, best=0.66, avg=0.65, std=0.00, steps=1.303e+08
2023-07-07 04:28:44,182 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 5400, best=0.66, avg=0.65, std=0.00, steps=1.327e+08
2023-07-07 04:29:06,386 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 5500, best=0.66, avg=0.65, std=0.00, steps=1.352e+08
2023-07-07 04:29:28,673 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 5600, best=0.66, avg=0.65, std=0.00, steps=1.377e+08
2023-07-07 04:29:50,940 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 5700, best=0.66, avg=0.65, std=0.00, steps=1.401e+08
2023-07-07 04:30:13,244 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 5800, best=0.66, avg=0.65, std=0.00, steps=1.426e+08
2023-07-07 04:30:35,353 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 5900, best=0.66, avg=0.65, std=0.00, steps=1.450e+08
2023-07-07 04:30:57,590 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 6000, best=0.66, avg=0.65, std=0.00, steps=1.475e+08
2023-07-07 04:31:19,768 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 6100, best=0.66, avg=0.65, std=0.00, steps=1.499e+08
2023-07-07 04:31:41,971 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 6200, best=0.66, avg=0.66, std=0.00, steps=1.524e+08
2023-07-07 04:32:04,175 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 6300, best=0.66, avg=0.66, std=0.00, steps=1.549e+08
2023-07-07 04:32:26,559 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 6400, best=0.66, avg=0.65, std=0.00, steps=1.573e+08
2023-07-07 04:32:48,834 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 6500, best=0.66, avg=0.66, std=0.00, steps=1.598e+08
2023-07-07 04:33:11,035 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 6600, best=0.66, avg=0.66, std=0.00, steps=1.622e+08
2023-07-07 04:33:33,239 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 6700, best=0.67, avg=0.66, std=0.00, steps=1.647e+08
2023-07-07 04:33:55,534 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 6800, best=0.66, avg=0.66, std=0.00, steps=1.671e+08
2023-07-07 04:34:17,755 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 6900, best=0.66, avg=0.66, std=0.00, steps=1.696e+08
2023-07-07 04:34:40,168 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 7000, best=0.67, avg=0.66, std=0.00, steps=1.721e+08
2023-07-07 04:35:02,515 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 7100, best=0.67, avg=0.66, std=0.00, steps=1.745e+08
2023-07-07 04:35:24,817 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 7200, best=0.67, avg=0.66, std=0.00, steps=1.770e+08
2023-07-07 04:35:46,941 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 7300, best=0.67, avg=0.66, std=0.00, steps=1.794e+08
2023-07-07 04:36:09,154 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 7400, best=0.67, avg=0.66, std=0.00, steps=1.819e+08
2023-07-07 04:36:31,317 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 7500, best=0.67, avg=0.66, std=0.00, steps=1.843e+08
2023-07-07 04:36:53,459 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 7600, best=0.67, avg=0.66, std=0.00, steps=1.868e+08
2023-07-07 04:37:15,638 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 7700, best=0.67, avg=0.66, std=0.00, steps=1.893e+08
2023-07-07 04:37:37,785 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 7800, best=0.67, avg=0.66, std=0.00, steps=1.917e+08
2023-07-07 04:37:59,918 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 7900, best=0.67, avg=0.66, std=0.00, steps=1.942e+08
2023-07-07 04:38:22,074 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 8000, best=0.67, avg=0.66, std=0.00, steps=1.966e+08
2023-07-07 04:38:44,252 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 8100, best=0.67, avg=0.67, std=0.00, steps=1.991e+08
2023-07-07 04:39:06,559 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 8200, best=0.67, avg=0.67, std=0.00, steps=2.015e+08
2023-07-07 04:39:28,882 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 8300, best=0.67, avg=0.67, std=0.00, steps=2.040e+08
2023-07-07 04:39:51,192 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 8400, best=0.67, avg=0.67, std=0.00, steps=2.065e+08
2023-07-07 04:40:13,496 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 8500, best=0.67, avg=0.67, std=0.00, steps=2.089e+08
2023-07-07 04:40:35,797 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 8600, best=0.67, avg=0.67, std=0.00, steps=2.114e+08
2023-07-07 04:40:58,001 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 8700, best=0.67, avg=0.67, std=0.00, steps=2.138e+08
2023-07-07 04:41:20,134 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 8800, best=0.67, avg=0.67, std=0.00, steps=2.163e+08
2023-07-07 04:41:42,322 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 8900, best=0.67, avg=0.67, std=0.00, steps=2.188e+08
2023-07-07 04:42:04,464 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 9000, best=0.67, avg=0.67, std=0.00, steps=2.212e+08
2023-07-07 04:42:26,669 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 9100, best=0.68, avg=0.67, std=0.00, steps=2.237e+08
2023-07-07 04:42:48,847 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 9200, best=0.68, avg=0.67, std=0.00, steps=2.261e+08
2023-07-07 04:43:11,028 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 9300, best=0.68, avg=0.67, std=0.00, steps=2.286e+08
2023-07-07 04:43:33,200 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 9400, best=0.68, avg=0.67, std=0.00, steps=2.310e+08
2023-07-07 04:43:55,500 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 9500, best=0.67, avg=0.67, std=0.00, steps=2.335e+08
2023-07-07 04:44:17,820 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 9600, best=0.68, avg=0.67, std=0.00, steps=2.360e+08
2023-07-07 04:44:40,013 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 9700, best=0.67, avg=0.67, std=0.00, steps=2.384e+08
2023-07-07 04:45:02,282 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 9800, best=0.68, avg=0.67, std=0.00, steps=2.409e+08
2023-07-07 04:45:24,538 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 9900, best=0.68, avg=0.67, std=0.00, steps=2.433e+08
2023-07-07 04:45:46,709 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 10000, best=0.67, avg=0.67, std=0.00, steps=2.458e+08
2023-07-07 04:46:08,985 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 10100, best=0.68, avg=0.67, std=0.00, steps=2.482e+08
2023-07-07 04:46:31,296 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 10200, best=0.68, avg=0.67, std=0.00, steps=2.507e+08
2023-07-07 04:46:53,468 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 10300, best=0.68, avg=0.67, std=0.00, steps=2.532e+08
2023-07-07 04:47:15,609 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 10400, best=0.68, avg=0.67, std=0.00, steps=2.556e+08
2023-07-07 04:47:37,814 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 10500, best=0.68, avg=0.67, std=0.00, steps=2.581e+08
2023-07-07 04:48:00,152 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 10600, best=0.68, avg=0.67, std=0.00, steps=2.605e+08
2023-07-07 04:48:22,406 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 10700, best=0.68, avg=0.67, std=0.00, steps=2.630e+08
2023-07-07 04:48:44,567 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 10800, best=0.68, avg=0.67, std=0.00, steps=2.654e+08
2023-07-07 04:49:06,746 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 10900, best=0.68, avg=0.67, std=0.00, steps=2.679e+08
2023-07-07 04:49:28,949 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 11000, best=0.68, avg=0.67, std=0.00, steps=2.704e+08
2023-07-07 04:49:51,206 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 11100, best=0.68, avg=0.67, std=0.00, steps=2.728e+08
2023-07-07 04:50:13,398 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 11200, best=0.68, avg=0.67, std=0.00, steps=2.753e+08
2023-07-07 04:50:35,585 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 11300, best=0.68, avg=0.67, std=0.00, steps=2.777e+08
2023-07-07 04:50:57,761 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 11400, best=0.68, avg=0.67, std=0.00, steps=2.802e+08
2023-07-07 04:51:20,028 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 11500, best=0.68, avg=0.67, std=0.00, steps=2.826e+08
2023-07-07 04:51:42,276 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 11600, best=0.68, avg=0.67, std=0.00, steps=2.851e+08
2023-07-07 04:52:04,524 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 11700, best=0.68, avg=0.67, std=0.00, steps=2.876e+08
2023-07-07 04:52:26,725 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 11800, best=0.68, avg=0.67, std=0.00, steps=2.900e+08
2023-07-07 04:52:48,854 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 11900, best=0.68, avg=0.68, std=0.00, steps=2.925e+08
2023-07-07 04:53:10,919 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 0, [Train]: 11999, best=0.68, avg=0.68, std=0.00, steps=2.949e+08
2023-07-07 04:53:10,920 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 04:53:10,943 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 04:53:10,972 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 04:53:43,216 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 100, best=0.51, avg=0.50, std=0.00, steps=3.310e+06
2023-07-07 04:54:12,623 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 200, best=0.51, avg=0.50, std=0.00, steps=6.586e+06
2023-07-07 04:54:42,273 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 300, best=0.51, avg=0.50, std=0.00, steps=9.863e+06
2023-07-07 04:55:11,797 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 400, best=0.51, avg=0.50, std=0.00, steps=1.314e+07
2023-07-07 04:55:41,394 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 500, best=0.51, avg=0.50, std=0.00, steps=1.642e+07
2023-07-07 04:56:11,091 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 600, best=0.51, avg=0.50, std=0.00, steps=1.969e+07
2023-07-07 04:56:40,776 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 700, best=0.51, avg=0.50, std=0.00, steps=2.297e+07
2023-07-07 04:57:10,215 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 800, best=0.51, avg=0.50, std=0.00, steps=2.625e+07
2023-07-07 04:57:39,679 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 900, best=0.51, avg=0.50, std=0.00, steps=2.952e+07
2023-07-07 04:58:09,247 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 1000, best=0.51, avg=0.50, std=0.00, steps=3.280e+07
2023-07-07 04:58:38,831 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 1100, best=0.51, avg=0.50, std=0.00, steps=3.608e+07
2023-07-07 04:59:08,391 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 1200, best=0.51, avg=0.50, std=0.00, steps=3.935e+07
2023-07-07 04:59:37,870 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 1300, best=0.51, avg=0.50, std=0.00, steps=4.263e+07
2023-07-07 05:00:07,456 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 1400, best=0.51, avg=0.50, std=0.00, steps=4.591e+07
2023-07-07 05:00:37,050 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 1500, best=0.51, avg=0.50, std=0.00, steps=4.918e+07
2023-07-07 05:01:06,713 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 1600, best=0.51, avg=0.50, std=0.00, steps=5.246e+07
2023-07-07 05:01:36,325 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 1700, best=0.51, avg=0.50, std=0.00, steps=5.574e+07
2023-07-07 05:02:05,783 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 1800, best=0.51, avg=0.50, std=0.00, steps=5.902e+07
2023-07-07 05:02:35,262 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 1900, best=0.51, avg=0.50, std=0.00, steps=6.229e+07
2023-07-07 05:03:04,799 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 2000, best=0.51, avg=0.50, std=0.00, steps=6.557e+07
2023-07-07 05:03:34,390 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 2100, best=0.51, avg=0.50, std=0.00, steps=6.885e+07
2023-07-07 05:04:03,879 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 2200, best=0.51, avg=0.50, std=0.00, steps=7.212e+07
2023-07-07 05:04:33,419 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 2300, best=0.51, avg=0.50, std=0.00, steps=7.540e+07
2023-07-07 05:05:02,959 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 2400, best=0.51, avg=0.50, std=0.00, steps=7.868e+07
2023-07-07 05:05:32,329 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 2500, best=0.51, avg=0.50, std=0.00, steps=8.195e+07
2023-07-07 05:06:01,859 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 2600, best=0.51, avg=0.50, std=0.00, steps=8.523e+07
2023-07-07 05:06:31,507 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 2700, best=0.51, avg=0.50, std=0.00, steps=8.851e+07
2023-07-07 05:07:01,142 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 2800, best=0.51, avg=0.50, std=0.00, steps=9.178e+07
2023-07-07 05:07:30,801 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 2900, best=0.51, avg=0.50, std=0.00, steps=9.506e+07
2023-07-07 05:08:00,410 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 3000, best=0.51, avg=0.50, std=0.00, steps=9.834e+07
2023-07-07 05:08:29,911 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 3100, best=0.51, avg=0.50, std=0.00, steps=1.016e+08
2023-07-07 05:08:59,442 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 3200, best=0.50, avg=0.50, std=0.00, steps=1.049e+08
2023-07-07 05:09:29,105 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 3300, best=0.51, avg=0.50, std=0.00, steps=1.082e+08
2023-07-07 05:09:58,807 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 3400, best=0.51, avg=0.50, std=0.00, steps=1.114e+08
2023-07-07 05:10:28,475 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 3500, best=0.51, avg=0.50, std=0.00, steps=1.147e+08
2023-07-07 05:10:58,107 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 3600, best=0.51, avg=0.50, std=0.00, steps=1.180e+08
2023-07-07 05:11:27,690 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 3700, best=0.51, avg=0.50, std=0.00, steps=1.213e+08
2023-07-07 05:11:57,266 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 3800, best=0.51, avg=0.50, std=0.00, steps=1.246e+08
2023-07-07 05:12:26,867 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 3900, best=0.51, avg=0.50, std=0.00, steps=1.278e+08
2023-07-07 05:12:56,369 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 4000, best=0.51, avg=0.50, std=0.00, steps=1.311e+08
2023-07-07 05:13:25,790 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 4100, best=0.51, avg=0.50, std=0.00, steps=1.344e+08
2023-07-07 05:13:55,180 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 4200, best=0.51, avg=0.50, std=0.00, steps=1.377e+08
2023-07-07 05:14:24,735 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 4300, best=0.51, avg=0.50, std=0.00, steps=1.409e+08
2023-07-07 05:14:54,312 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 4400, best=0.53, avg=0.53, std=0.00, steps=1.442e+08
2023-07-07 05:15:23,769 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 4500, best=0.55, avg=0.55, std=0.00, steps=1.475e+08
2023-07-07 05:15:53,257 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 4600, best=0.56, avg=0.56, std=0.00, steps=1.508e+08
2023-07-07 05:16:22,735 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 4700, best=0.58, avg=0.57, std=0.00, steps=1.540e+08
2023-07-07 05:16:52,337 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 4800, best=0.58, avg=0.58, std=0.00, steps=1.573e+08
2023-07-07 05:17:21,815 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 4900, best=0.59, avg=0.58, std=0.00, steps=1.606e+08
2023-07-07 05:17:51,304 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 5000, best=0.60, avg=0.59, std=0.00, steps=1.639e+08
2023-07-07 05:18:20,849 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 5100, best=0.60, avg=0.60, std=0.00, steps=1.671e+08
2023-07-07 05:18:50,272 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 5200, best=0.60, avg=0.60, std=0.00, steps=1.704e+08
2023-07-07 05:19:19,654 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 5300, best=0.61, avg=0.60, std=0.00, steps=1.737e+08
2023-07-07 05:19:49,066 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 5400, best=0.61, avg=0.60, std=0.00, steps=1.770e+08
2023-07-07 05:20:18,484 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 5500, best=0.61, avg=0.61, std=0.00, steps=1.803e+08
2023-07-07 05:20:47,996 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 5600, best=0.61, avg=0.61, std=0.00, steps=1.835e+08
2023-07-07 05:21:17,472 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 5700, best=0.62, avg=0.61, std=0.00, steps=1.868e+08
2023-07-07 05:21:46,939 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 5800, best=0.62, avg=0.61, std=0.00, steps=1.901e+08
2023-07-07 05:22:16,490 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 5900, best=0.62, avg=0.61, std=0.00, steps=1.934e+08
2023-07-07 05:22:46,117 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 6000, best=0.62, avg=0.61, std=0.00, steps=1.966e+08
2023-07-07 05:23:15,599 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 6100, best=0.62, avg=0.62, std=0.00, steps=1.999e+08
2023-07-07 05:23:45,172 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 6200, best=0.62, avg=0.62, std=0.00, steps=2.032e+08
2023-07-07 05:24:14,739 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 6300, best=0.62, avg=0.62, std=0.00, steps=2.065e+08
2023-07-07 05:24:44,261 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 6400, best=0.62, avg=0.62, std=0.00, steps=2.097e+08
2023-07-07 05:25:13,765 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 6500, best=0.62, avg=0.62, std=0.00, steps=2.130e+08
2023-07-07 05:25:43,404 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 6600, best=0.63, avg=0.62, std=0.00, steps=2.163e+08
2023-07-07 05:26:12,843 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 6700, best=0.63, avg=0.62, std=0.00, steps=2.196e+08
2023-07-07 05:26:42,368 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 6800, best=0.63, avg=0.62, std=0.00, steps=2.229e+08
2023-07-07 05:27:12,066 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 6900, best=0.63, avg=0.63, std=0.00, steps=2.261e+08
2023-07-07 05:27:41,681 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 7000, best=0.63, avg=0.63, std=0.00, steps=2.294e+08
2023-07-07 05:28:11,331 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 7100, best=0.63, avg=0.63, std=0.00, steps=2.327e+08
2023-07-07 05:28:40,905 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 7200, best=0.63, avg=0.63, std=0.00, steps=2.360e+08
2023-07-07 05:29:10,378 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 7300, best=0.64, avg=0.63, std=0.00, steps=2.392e+08
2023-07-07 05:29:40,014 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 7400, best=0.63, avg=0.63, std=0.00, steps=2.425e+08
2023-07-07 05:30:09,561 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 7500, best=0.64, avg=0.63, std=0.00, steps=2.458e+08
2023-07-07 05:30:39,031 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 7600, best=0.64, avg=0.63, std=0.00, steps=2.491e+08
2023-07-07 05:31:08,683 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 7700, best=0.64, avg=0.63, std=0.00, steps=2.523e+08
2023-07-07 05:31:38,386 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 7800, best=0.64, avg=0.63, std=0.00, steps=2.556e+08
2023-07-07 05:32:08,001 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 7900, best=0.64, avg=0.63, std=0.00, steps=2.589e+08
2023-07-07 05:32:37,619 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 8000, best=0.64, avg=0.63, std=0.00, steps=2.622e+08
2023-07-07 05:33:07,275 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 8100, best=0.64, avg=0.64, std=0.00, steps=2.655e+08
2023-07-07 05:33:36,901 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 8200, best=0.64, avg=0.64, std=0.00, steps=2.687e+08
2023-07-07 05:34:06,305 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 8300, best=0.64, avg=0.64, std=0.00, steps=2.720e+08
2023-07-07 05:34:35,891 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 8400, best=0.64, avg=0.64, std=0.00, steps=2.753e+08
2023-07-07 05:35:05,445 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 8500, best=0.64, avg=0.64, std=0.00, steps=2.786e+08
2023-07-07 05:35:34,971 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 8600, best=0.64, avg=0.64, std=0.00, steps=2.818e+08
2023-07-07 05:36:04,463 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 8700, best=0.64, avg=0.64, std=0.00, steps=2.851e+08
2023-07-07 05:36:33,975 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 8800, best=0.64, avg=0.64, std=0.00, steps=2.884e+08
2023-07-07 05:37:03,431 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 8900, best=0.65, avg=0.64, std=0.00, steps=2.917e+08
2023-07-07 05:37:33,079 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 9000, best=0.65, avg=0.64, std=0.00, steps=2.949e+08
2023-07-07 05:38:02,614 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 9100, best=0.65, avg=0.64, std=0.00, steps=2.982e+08
2023-07-07 05:38:32,019 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 9200, best=0.65, avg=0.64, std=0.00, steps=3.015e+08
2023-07-07 05:39:01,560 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 9300, best=0.65, avg=0.64, std=0.00, steps=3.048e+08
2023-07-07 05:39:31,237 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 9400, best=0.65, avg=0.64, std=0.00, steps=3.081e+08
2023-07-07 05:40:00,863 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 9500, best=0.65, avg=0.64, std=0.00, steps=3.113e+08
2023-07-07 05:40:30,538 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 9600, best=0.65, avg=0.64, std=0.00, steps=3.146e+08
2023-07-07 05:41:00,133 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 9700, best=0.65, avg=0.64, std=0.00, steps=3.179e+08
2023-07-07 05:41:29,678 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 9800, best=0.65, avg=0.64, std=0.00, steps=3.212e+08
2023-07-07 05:41:59,299 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 9900, best=0.65, avg=0.64, std=0.00, steps=3.244e+08
2023-07-07 05:42:28,848 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 10000, best=0.65, avg=0.65, std=0.00, steps=3.277e+08
2023-07-07 05:42:58,423 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 10100, best=0.65, avg=0.65, std=0.00, steps=3.310e+08
2023-07-07 05:43:28,042 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 10200, best=0.65, avg=0.65, std=0.00, steps=3.343e+08
2023-07-07 05:43:57,710 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 10300, best=0.65, avg=0.65, std=0.00, steps=3.375e+08
2023-07-07 05:44:27,242 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 10400, best=0.65, avg=0.65, std=0.00, steps=3.408e+08
2023-07-07 05:44:56,831 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 10500, best=0.65, avg=0.65, std=0.00, steps=3.441e+08
2023-07-07 05:45:26,322 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 10600, best=0.65, avg=0.65, std=0.00, steps=3.474e+08
2023-07-07 05:45:55,877 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 10700, best=0.65, avg=0.65, std=0.00, steps=3.507e+08
2023-07-07 05:46:25,422 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 10800, best=0.65, avg=0.65, std=0.00, steps=3.539e+08
2023-07-07 05:46:54,898 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 10900, best=0.65, avg=0.65, std=0.00, steps=3.572e+08
2023-07-07 05:47:24,331 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 11000, best=0.65, avg=0.65, std=0.00, steps=3.605e+08
2023-07-07 05:47:53,863 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 11100, best=0.66, avg=0.65, std=0.00, steps=3.638e+08
2023-07-07 05:48:23,387 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 11200, best=0.65, avg=0.65, std=0.00, steps=3.670e+08
2023-07-07 05:48:52,969 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 11300, best=0.66, avg=0.65, std=0.00, steps=3.703e+08
2023-07-07 05:49:22,635 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 11400, best=0.65, avg=0.65, std=0.00, steps=3.736e+08
2023-07-07 05:49:52,305 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 11500, best=0.65, avg=0.65, std=0.00, steps=3.769e+08
2023-07-07 05:50:21,770 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 11600, best=0.66, avg=0.65, std=0.00, steps=3.801e+08
2023-07-07 05:50:51,356 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 11700, best=0.66, avg=0.65, std=0.00, steps=3.834e+08
2023-07-07 05:51:20,835 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 11800, best=0.66, avg=0.65, std=0.00, steps=3.867e+08
2023-07-07 05:51:50,365 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 11900, best=0.66, avg=0.65, std=0.00, steps=3.900e+08
2023-07-07 05:52:19,657 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 0, 0, [Train]: 11999, best=0.66, avg=0.65, std=0.00, steps=3.932e+08
2023-07-07 05:52:19,657 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 05:52:19,682 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 05:52:19,716 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 05:52:53,431 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 100, best=0.51, avg=0.50, std=0.00, steps=3.516e+06
2023-07-07 05:53:24,900 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 200, best=0.57, avg=0.57, std=0.00, steps=6.998e+06
2023-07-07 05:53:56,378 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 300, best=0.57, avg=0.57, std=0.00, steps=1.048e+07
2023-07-07 05:54:27,810 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 400, best=0.57, avg=0.57, std=0.00, steps=1.396e+07
2023-07-07 05:54:59,196 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 500, best=0.58, avg=0.57, std=0.00, steps=1.744e+07
2023-07-07 05:55:30,491 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 600, best=0.58, avg=0.57, std=0.00, steps=2.092e+07
2023-07-07 05:56:01,925 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 700, best=0.58, avg=0.57, std=0.00, steps=2.441e+07
2023-07-07 05:56:33,337 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 800, best=0.58, avg=0.58, std=0.00, steps=2.789e+07
2023-07-07 05:57:04,930 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 900, best=0.58, avg=0.58, std=0.00, steps=3.137e+07
2023-07-07 05:57:36,474 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 1000, best=0.59, avg=0.58, std=0.00, steps=3.485e+07
2023-07-07 05:58:07,938 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 1100, best=0.59, avg=0.59, std=0.00, steps=3.833e+07
2023-07-07 05:58:39,260 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 1200, best=0.60, avg=0.59, std=0.00, steps=4.181e+07
2023-07-07 05:59:10,681 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 1300, best=0.60, avg=0.59, std=0.00, steps=4.530e+07
2023-07-07 05:59:42,044 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 1400, best=0.60, avg=0.60, std=0.00, steps=4.878e+07
2023-07-07 06:00:13,422 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 1500, best=0.60, avg=0.60, std=0.00, steps=5.226e+07
2023-07-07 06:00:44,906 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 1600, best=0.60, avg=0.60, std=0.00, steps=5.574e+07
2023-07-07 06:01:16,247 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 1700, best=0.60, avg=0.60, std=0.00, steps=5.922e+07
2023-07-07 06:01:47,479 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 1800, best=0.60, avg=0.60, std=0.00, steps=6.270e+07
2023-07-07 06:02:18,731 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 1900, best=0.60, avg=0.60, std=0.00, steps=6.619e+07
2023-07-07 06:02:50,143 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 2000, best=0.60, avg=0.60, std=0.00, steps=6.967e+07
2023-07-07 06:03:21,533 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 2100, best=0.60, avg=0.60, std=0.00, steps=7.315e+07
2023-07-07 06:03:53,061 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 2200, best=0.61, avg=0.60, std=0.00, steps=7.663e+07
2023-07-07 06:04:24,498 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 2300, best=0.61, avg=0.60, std=0.00, steps=8.011e+07
2023-07-07 06:04:55,924 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 2400, best=0.61, avg=0.60, std=0.00, steps=8.359e+07
2023-07-07 06:05:27,309 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 2500, best=0.61, avg=0.60, std=0.00, steps=8.707e+07
2023-07-07 06:05:58,616 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 2600, best=0.61, avg=0.60, std=0.00, steps=9.056e+07
2023-07-07 06:06:29,832 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 2700, best=0.61, avg=0.60, std=0.00, steps=9.404e+07
2023-07-07 06:07:01,119 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 2800, best=0.61, avg=0.60, std=0.00, steps=9.752e+07
2023-07-07 06:07:32,484 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 2900, best=0.61, avg=0.60, std=0.00, steps=1.010e+08
2023-07-07 06:08:03,796 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 3000, best=0.61, avg=0.60, std=0.00, steps=1.045e+08
2023-07-07 06:08:35,082 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 3100, best=0.61, avg=0.60, std=0.00, steps=1.080e+08
2023-07-07 06:09:06,393 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 3200, best=0.61, avg=0.60, std=0.00, steps=1.114e+08
2023-07-07 06:09:37,821 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 3300, best=0.61, avg=0.60, std=0.00, steps=1.149e+08
2023-07-07 06:10:09,612 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 3400, best=0.61, avg=0.60, std=0.00, steps=1.184e+08
2023-07-07 06:10:41,108 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 3500, best=0.61, avg=0.60, std=0.00, steps=1.219e+08
2023-07-07 06:11:12,477 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 3600, best=0.61, avg=0.60, std=0.00, steps=1.254e+08
2023-07-07 06:11:43,784 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 3700, best=0.61, avg=0.60, std=0.00, steps=1.289e+08
2023-07-07 06:12:15,100 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 3800, best=0.61, avg=0.60, std=0.00, steps=1.323e+08
2023-07-07 06:12:46,391 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 3900, best=0.61, avg=0.60, std=0.00, steps=1.358e+08
2023-07-07 06:13:17,680 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 4000, best=0.61, avg=0.60, std=0.00, steps=1.393e+08
2023-07-07 06:13:49,004 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 4100, best=0.61, avg=0.60, std=0.00, steps=1.428e+08
2023-07-07 06:14:20,318 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 4200, best=0.61, avg=0.60, std=0.00, steps=1.463e+08
2023-07-07 06:14:51,660 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 4300, best=0.61, avg=0.61, std=0.00, steps=1.497e+08
2023-07-07 06:15:23,006 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 4400, best=0.61, avg=0.61, std=0.00, steps=1.532e+08
2023-07-07 06:15:54,330 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 4500, best=0.61, avg=0.61, std=0.00, steps=1.567e+08
2023-07-07 06:16:25,657 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 4600, best=0.61, avg=0.61, std=0.00, steps=1.602e+08
2023-07-07 06:16:56,886 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 4700, best=0.61, avg=0.61, std=0.00, steps=1.637e+08
2023-07-07 06:17:28,244 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 4800, best=0.61, avg=0.61, std=0.00, steps=1.672e+08
2023-07-07 06:17:59,576 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 4900, best=0.61, avg=0.61, std=0.00, steps=1.706e+08
2023-07-07 06:18:30,948 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 5000, best=0.61, avg=0.61, std=0.00, steps=1.741e+08
2023-07-07 06:19:02,233 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 5100, best=0.61, avg=0.61, std=0.00, steps=1.776e+08
2023-07-07 06:19:33,545 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 5200, best=0.62, avg=0.61, std=0.00, steps=1.811e+08
2023-07-07 06:20:04,883 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 5300, best=0.61, avg=0.61, std=0.00, steps=1.846e+08
2023-07-07 06:20:36,245 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 5400, best=0.61, avg=0.61, std=0.00, steps=1.880e+08
2023-07-07 06:21:07,650 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 5500, best=0.62, avg=0.61, std=0.00, steps=1.915e+08
2023-07-07 06:21:38,913 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 5600, best=0.62, avg=0.61, std=0.00, steps=1.950e+08
2023-07-07 06:22:10,308 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 5700, best=0.62, avg=0.61, std=0.00, steps=1.985e+08
2023-07-07 06:22:41,868 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 5800, best=0.62, avg=0.61, std=0.00, steps=2.020e+08
2023-07-07 06:23:13,184 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 5900, best=0.62, avg=0.61, std=0.00, steps=2.054e+08
2023-07-07 06:23:44,629 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 6000, best=0.62, avg=0.62, std=0.00, steps=2.089e+08
2023-07-07 06:24:16,108 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 6100, best=0.62, avg=0.62, std=0.00, steps=2.124e+08
2023-07-07 06:24:47,620 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 6200, best=0.62, avg=0.62, std=0.00, steps=2.159e+08
2023-07-07 06:25:19,045 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 6300, best=0.63, avg=0.62, std=0.00, steps=2.194e+08
2023-07-07 06:25:50,413 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 6400, best=0.63, avg=0.62, std=0.00, steps=2.229e+08
2023-07-07 06:26:21,747 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 6500, best=0.63, avg=0.62, std=0.00, steps=2.263e+08
2023-07-07 06:26:53,129 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 6600, best=0.63, avg=0.62, std=0.00, steps=2.298e+08
2023-07-07 06:27:24,469 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 6700, best=0.63, avg=0.62, std=0.00, steps=2.333e+08
2023-07-07 06:27:55,890 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 6800, best=0.63, avg=0.62, std=0.00, steps=2.368e+08
2023-07-07 06:28:27,154 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 6900, best=0.63, avg=0.63, std=0.00, steps=2.403e+08
2023-07-07 06:28:58,716 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 7000, best=0.63, avg=0.63, std=0.00, steps=2.437e+08
2023-07-07 06:29:29,960 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 7100, best=0.63, avg=0.63, std=0.00, steps=2.472e+08
2023-07-07 06:30:01,176 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 7200, best=0.63, avg=0.63, std=0.00, steps=2.507e+08
2023-07-07 06:30:32,514 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 7300, best=0.64, avg=0.63, std=0.00, steps=2.542e+08
2023-07-07 06:31:03,968 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 7400, best=0.64, avg=0.63, std=0.00, steps=2.577e+08
2023-07-07 06:31:35,405 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 7500, best=0.64, avg=0.63, std=0.00, steps=2.612e+08
2023-07-07 06:32:06,649 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 7600, best=0.64, avg=0.63, std=0.00, steps=2.646e+08
2023-07-07 06:32:38,088 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 7700, best=0.64, avg=0.63, std=0.00, steps=2.681e+08
2023-07-07 06:33:09,587 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 7800, best=0.64, avg=0.63, std=0.00, steps=2.716e+08
2023-07-07 06:33:40,913 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 7900, best=0.64, avg=0.63, std=0.00, steps=2.751e+08
2023-07-07 06:34:12,170 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 8000, best=0.64, avg=0.63, std=0.00, steps=2.786e+08
2023-07-07 06:34:43,596 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 8100, best=0.64, avg=0.63, std=0.00, steps=2.820e+08
2023-07-07 06:35:15,076 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 8200, best=0.64, avg=0.63, std=0.00, steps=2.855e+08
2023-07-07 06:35:46,411 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 8300, best=0.64, avg=0.64, std=0.00, steps=2.890e+08
2023-07-07 06:36:17,758 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 8400, best=0.64, avg=0.64, std=0.00, steps=2.925e+08
2023-07-07 06:36:49,086 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 8500, best=0.64, avg=0.64, std=0.00, steps=2.960e+08
2023-07-07 06:37:20,544 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 8600, best=0.64, avg=0.64, std=0.00, steps=2.995e+08
2023-07-07 06:37:51,934 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 8700, best=0.64, avg=0.64, std=0.00, steps=3.029e+08
2023-07-07 06:38:23,174 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 8800, best=0.64, avg=0.64, std=0.00, steps=3.064e+08
2023-07-07 06:38:54,469 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 8900, best=0.64, avg=0.64, std=0.00, steps=3.099e+08
2023-07-07 06:39:25,906 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 9000, best=0.64, avg=0.64, std=0.00, steps=3.134e+08
2023-07-07 06:39:57,444 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 9100, best=0.64, avg=0.64, std=0.00, steps=3.169e+08
2023-07-07 06:40:28,898 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 9200, best=0.64, avg=0.64, std=0.00, steps=3.203e+08
2023-07-07 06:41:00,198 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 9300, best=0.64, avg=0.64, std=0.00, steps=3.238e+08
2023-07-07 06:41:31,547 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 9400, best=0.65, avg=0.64, std=0.00, steps=3.273e+08
2023-07-07 06:42:02,945 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 9500, best=0.65, avg=0.64, std=0.00, steps=3.308e+08
2023-07-07 06:42:34,446 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 9600, best=0.64, avg=0.64, std=0.00, steps=3.343e+08
2023-07-07 06:43:05,905 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 9700, best=0.65, avg=0.64, std=0.00, steps=3.378e+08
2023-07-07 06:43:37,235 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 9800, best=0.65, avg=0.64, std=0.00, steps=3.412e+08
2023-07-07 06:44:08,576 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 9900, best=0.65, avg=0.64, std=0.00, steps=3.447e+08
2023-07-07 06:44:40,010 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 10000, best=0.65, avg=0.64, std=0.00, steps=3.482e+08
2023-07-07 06:45:11,393 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 10100, best=0.65, avg=0.64, std=0.00, steps=3.517e+08
2023-07-07 06:45:43,026 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 10200, best=0.65, avg=0.64, std=0.00, steps=3.552e+08
2023-07-07 06:46:14,455 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 10300, best=0.65, avg=0.64, std=0.00, steps=3.586e+08
2023-07-07 06:46:46,000 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 10400, best=0.65, avg=0.64, std=0.00, steps=3.621e+08
2023-07-07 06:47:17,499 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 10500, best=0.65, avg=0.64, std=0.00, steps=3.656e+08
2023-07-07 06:47:49,049 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 10600, best=0.65, avg=0.64, std=0.00, steps=3.691e+08
2023-07-07 06:48:20,537 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 10700, best=0.65, avg=0.64, std=0.00, steps=3.726e+08
2023-07-07 06:48:51,962 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 10800, best=0.65, avg=0.65, std=0.00, steps=3.760e+08
2023-07-07 06:49:23,345 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 10900, best=0.65, avg=0.65, std=0.00, steps=3.795e+08
2023-07-07 06:49:54,814 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 11000, best=0.65, avg=0.65, std=0.00, steps=3.830e+08
2023-07-07 06:50:26,145 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 11100, best=0.65, avg=0.65, std=0.00, steps=3.865e+08
2023-07-07 06:50:57,595 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 11200, best=0.65, avg=0.65, std=0.00, steps=3.900e+08
2023-07-07 06:51:29,088 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 11300, best=0.65, avg=0.65, std=0.00, steps=3.935e+08
2023-07-07 06:52:00,435 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 11400, best=0.65, avg=0.65, std=0.00, steps=3.969e+08
2023-07-07 06:52:31,743 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 11500, best=0.65, avg=0.65, std=0.00, steps=4.004e+08
2023-07-07 06:53:03,310 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 11600, best=0.66, avg=0.65, std=0.00, steps=4.039e+08
2023-07-07 06:53:34,802 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 11700, best=0.65, avg=0.65, std=0.00, steps=4.074e+08
2023-07-07 06:54:06,355 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 11800, best=0.66, avg=0.65, std=0.00, steps=4.109e+08
2023-07-07 06:54:37,821 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 11900, best=0.66, avg=0.65, std=0.00, steps=4.143e+08
2023-07-07 06:55:08,858 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 8, 0, [Train]: 11999, best=0.66, avg=0.65, std=0.00, steps=4.178e+08
2023-07-07 06:55:08,859 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 06:55:08,884 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 06:55:08,914 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 06:55:44,381 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 100, best=0.51, avg=0.50, std=0.00, steps=3.723e+06
2023-07-07 06:56:17,586 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 200, best=0.51, avg=0.50, std=0.00, steps=7.410e+06
2023-07-07 06:56:50,774 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 300, best=0.51, avg=0.50, std=0.00, steps=1.110e+07
2023-07-07 06:57:24,107 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 400, best=0.51, avg=0.50, std=0.00, steps=1.478e+07
2023-07-07 06:57:57,393 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 500, best=0.51, avg=0.50, std=0.00, steps=1.847e+07
2023-07-07 06:58:30,640 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 600, best=0.51, avg=0.50, std=0.00, steps=2.216e+07
2023-07-07 06:59:03,833 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 700, best=0.51, avg=0.50, std=0.00, steps=2.584e+07
2023-07-07 06:59:37,036 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 800, best=0.51, avg=0.50, std=0.00, steps=2.953e+07
2023-07-07 07:00:10,213 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 900, best=0.51, avg=0.50, std=0.00, steps=3.321e+07
2023-07-07 07:00:43,542 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 1000, best=0.51, avg=0.50, std=0.00, steps=3.690e+07
2023-07-07 07:01:16,750 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 1100, best=0.51, avg=0.50, std=0.00, steps=4.059e+07
2023-07-07 07:01:49,973 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 1200, best=0.51, avg=0.50, std=0.00, steps=4.427e+07
2023-07-07 07:02:23,165 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 1300, best=0.51, avg=0.50, std=0.00, steps=4.796e+07
2023-07-07 07:02:56,554 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 1400, best=0.51, avg=0.50, std=0.00, steps=5.165e+07
2023-07-07 07:03:29,717 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 1500, best=0.51, avg=0.50, std=0.00, steps=5.533e+07
2023-07-07 07:04:02,998 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 1600, best=0.51, avg=0.50, std=0.00, steps=5.902e+07
2023-07-07 07:04:36,166 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 1700, best=0.51, avg=0.50, std=0.00, steps=6.271e+07
2023-07-07 07:05:09,434 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 1800, best=0.51, avg=0.50, std=0.00, steps=6.639e+07
2023-07-07 07:05:42,674 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 1900, best=0.51, avg=0.50, std=0.00, steps=7.008e+07
2023-07-07 07:06:15,936 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 2000, best=0.51, avg=0.50, std=0.00, steps=7.376e+07
2023-07-07 07:06:49,120 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 2100, best=0.51, avg=0.50, std=0.00, steps=7.745e+07
2023-07-07 07:07:22,460 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 2200, best=0.51, avg=0.50, std=0.00, steps=8.114e+07
2023-07-07 07:07:55,580 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 2300, best=0.51, avg=0.50, std=0.00, steps=8.482e+07
2023-07-07 07:08:28,821 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 2400, best=0.51, avg=0.50, std=0.00, steps=8.851e+07
2023-07-07 07:09:02,029 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 2500, best=0.54, avg=0.53, std=0.00, steps=9.220e+07
2023-07-07 07:09:35,280 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 2600, best=0.56, avg=0.55, std=0.00, steps=9.588e+07
2023-07-07 07:10:08,479 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 2700, best=0.57, avg=0.56, std=0.00, steps=9.957e+07
2023-07-07 07:10:41,646 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 2800, best=0.57, avg=0.57, std=0.00, steps=1.033e+08
2023-07-07 07:11:14,785 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 2900, best=0.58, avg=0.57, std=0.00, steps=1.069e+08
2023-07-07 07:11:47,987 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 3000, best=0.58, avg=0.58, std=0.00, steps=1.106e+08
2023-07-07 07:12:21,242 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 3100, best=0.58, avg=0.58, std=0.00, steps=1.143e+08
2023-07-07 07:12:54,589 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 3200, best=0.58, avg=0.58, std=0.00, steps=1.180e+08
2023-07-07 07:13:27,952 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 3300, best=0.59, avg=0.58, std=0.00, steps=1.217e+08
2023-07-07 07:14:01,111 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 3400, best=0.59, avg=0.58, std=0.00, steps=1.254e+08
2023-07-07 07:14:34,296 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 3500, best=0.59, avg=0.59, std=0.00, steps=1.291e+08
2023-07-07 07:15:07,465 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 3600, best=0.59, avg=0.59, std=0.00, steps=1.327e+08
2023-07-07 07:15:40,604 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 3700, best=0.59, avg=0.59, std=0.00, steps=1.364e+08
2023-07-07 07:16:13,730 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 3800, best=0.60, avg=0.59, std=0.00, steps=1.401e+08
2023-07-07 07:16:46,872 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 3900, best=0.60, avg=0.59, std=0.00, steps=1.438e+08
2023-07-07 07:17:20,006 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 4000, best=0.60, avg=0.59, std=0.00, steps=1.475e+08
2023-07-07 07:17:53,161 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 4100, best=0.60, avg=0.59, std=0.00, steps=1.512e+08
2023-07-07 07:18:26,277 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 4200, best=0.60, avg=0.59, std=0.00, steps=1.549e+08
2023-07-07 07:18:59,479 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 4300, best=0.60, avg=0.60, std=0.00, steps=1.586e+08
2023-07-07 07:19:32,597 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 4400, best=0.60, avg=0.60, std=0.00, steps=1.622e+08
2023-07-07 07:20:05,873 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 4500, best=0.60, avg=0.60, std=0.00, steps=1.659e+08
2023-07-07 07:20:39,114 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 4600, best=0.60, avg=0.60, std=0.00, steps=1.696e+08
2023-07-07 07:21:12,465 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 4700, best=0.60, avg=0.60, std=0.00, steps=1.733e+08
2023-07-07 07:21:45,779 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 4800, best=0.60, avg=0.60, std=0.00, steps=1.770e+08
2023-07-07 07:22:19,171 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 4900, best=0.60, avg=0.60, std=0.00, steps=1.807e+08
2023-07-07 07:22:52,376 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 5000, best=0.60, avg=0.60, std=0.00, steps=1.844e+08
2023-07-07 07:23:25,634 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 5100, best=0.61, avg=0.60, std=0.00, steps=1.880e+08
2023-07-07 07:23:58,887 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 5200, best=0.61, avg=0.60, std=0.00, steps=1.917e+08
2023-07-07 07:24:32,130 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 5300, best=0.61, avg=0.60, std=0.00, steps=1.954e+08
2023-07-07 07:25:05,260 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 5400, best=0.61, avg=0.60, std=0.00, steps=1.991e+08
2023-07-07 07:25:38,489 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 5500, best=0.61, avg=0.60, std=0.00, steps=2.028e+08
2023-07-07 07:26:11,782 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 5600, best=0.61, avg=0.61, std=0.00, steps=2.065e+08
2023-07-07 07:26:45,146 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 5700, best=0.61, avg=0.61, std=0.00, steps=2.102e+08
2023-07-07 07:27:18,347 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 5800, best=0.61, avg=0.61, std=0.00, steps=2.138e+08
2023-07-07 07:27:51,473 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 5900, best=0.61, avg=0.61, std=0.00, steps=2.175e+08
2023-07-07 07:28:24,852 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 6000, best=0.61, avg=0.61, std=0.00, steps=2.212e+08
2023-07-07 07:28:58,006 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 6100, best=0.61, avg=0.61, std=0.00, steps=2.249e+08
2023-07-07 07:29:31,281 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 6200, best=0.61, avg=0.61, std=0.00, steps=2.286e+08
2023-07-07 07:30:04,452 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 6300, best=0.62, avg=0.61, std=0.00, steps=2.323e+08
2023-07-07 07:30:37,617 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 6400, best=0.61, avg=0.61, std=0.00, steps=2.360e+08
2023-07-07 07:31:10,795 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 6500, best=0.61, avg=0.61, std=0.00, steps=2.397e+08
2023-07-07 07:31:43,864 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 6600, best=0.62, avg=0.61, std=0.00, steps=2.433e+08
2023-07-07 07:32:17,108 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 6700, best=0.62, avg=0.61, std=0.00, steps=2.470e+08
2023-07-07 07:32:50,589 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 6800, best=0.62, avg=0.61, std=0.00, steps=2.507e+08
2023-07-07 07:33:23,885 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 6900, best=0.62, avg=0.61, std=0.00, steps=2.544e+08
2023-07-07 07:33:57,052 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 7000, best=0.62, avg=0.61, std=0.00, steps=2.581e+08
2023-07-07 07:34:30,129 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 7100, best=0.62, avg=0.61, std=0.00, steps=2.618e+08
2023-07-07 07:35:03,322 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 7200, best=0.62, avg=0.61, std=0.00, steps=2.655e+08
2023-07-07 07:35:36,460 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 7300, best=0.62, avg=0.61, std=0.00, steps=2.691e+08
2023-07-07 07:36:09,566 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 7400, best=0.62, avg=0.62, std=0.00, steps=2.728e+08
2023-07-07 07:36:42,665 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 7500, best=0.62, avg=0.62, std=0.00, steps=2.765e+08
2023-07-07 07:37:15,811 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 7600, best=0.62, avg=0.62, std=0.00, steps=2.802e+08
2023-07-07 07:37:48,926 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 7700, best=0.62, avg=0.62, std=0.00, steps=2.839e+08
2023-07-07 07:38:22,352 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 7800, best=0.62, avg=0.62, std=0.00, steps=2.876e+08
2023-07-07 07:38:55,687 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 7900, best=0.62, avg=0.62, std=0.00, steps=2.913e+08
2023-07-07 07:39:28,776 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 8000, best=0.62, avg=0.62, std=0.00, steps=2.949e+08
2023-07-07 07:40:01,953 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 8100, best=0.62, avg=0.62, std=0.00, steps=2.986e+08
2023-07-07 07:40:35,133 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 8200, best=0.62, avg=0.62, std=0.00, steps=3.023e+08
2023-07-07 07:41:08,480 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 8300, best=0.62, avg=0.62, std=0.00, steps=3.060e+08
2023-07-07 07:41:41,856 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 8400, best=0.62, avg=0.62, std=0.00, steps=3.097e+08
2023-07-07 07:42:15,114 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 8500, best=0.62, avg=0.62, std=0.00, steps=3.134e+08
2023-07-07 07:42:48,417 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 8600, best=0.62, avg=0.62, std=0.00, steps=3.171e+08
2023-07-07 07:43:21,623 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 8700, best=0.62, avg=0.62, std=0.00, steps=3.208e+08
2023-07-07 07:43:54,849 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 8800, best=0.62, avg=0.62, std=0.00, steps=3.244e+08
2023-07-07 07:44:27,966 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 8900, best=0.63, avg=0.62, std=0.00, steps=3.281e+08
2023-07-07 07:45:01,291 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 9000, best=0.62, avg=0.62, std=0.00, steps=3.318e+08
2023-07-07 07:45:34,517 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 9100, best=0.63, avg=0.62, std=0.00, steps=3.355e+08
2023-07-07 07:46:07,906 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 9200, best=0.63, avg=0.62, std=0.00, steps=3.392e+08
2023-07-07 07:46:41,118 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 9300, best=0.63, avg=0.62, std=0.00, steps=3.429e+08
2023-07-07 07:47:14,487 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 9400, best=0.62, avg=0.62, std=0.00, steps=3.466e+08
2023-07-07 07:47:47,591 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 9500, best=0.62, avg=0.62, std=0.00, steps=3.502e+08
2023-07-07 07:48:20,984 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 9600, best=0.62, avg=0.62, std=0.00, steps=3.539e+08
2023-07-07 07:48:54,078 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 9700, best=0.62, avg=0.62, std=0.00, steps=3.576e+08
2023-07-07 07:49:27,262 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 9800, best=0.63, avg=0.62, std=0.00, steps=3.613e+08
2023-07-07 07:50:00,518 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 9900, best=0.63, avg=0.62, std=0.00, steps=3.650e+08
2023-07-07 07:50:33,837 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 10000, best=0.63, avg=0.62, std=0.00, steps=3.687e+08
2023-07-07 07:51:07,120 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 10100, best=0.63, avg=0.62, std=0.00, steps=3.724e+08
2023-07-07 07:51:40,318 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 10200, best=0.63, avg=0.62, std=0.00, steps=3.760e+08
2023-07-07 07:52:13,593 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 10300, best=0.63, avg=0.62, std=0.00, steps=3.797e+08
2023-07-07 07:52:46,708 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 10400, best=0.63, avg=0.62, std=0.00, steps=3.834e+08
2023-07-07 07:53:19,859 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 10500, best=0.63, avg=0.62, std=0.00, steps=3.871e+08
2023-07-07 07:53:53,043 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 10600, best=0.63, avg=0.62, std=0.00, steps=3.908e+08
2023-07-07 07:54:26,260 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 10700, best=0.63, avg=0.62, std=0.00, steps=3.945e+08
2023-07-07 07:54:59,340 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 10800, best=0.63, avg=0.62, std=0.00, steps=3.982e+08
2023-07-07 07:55:32,570 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 10900, best=0.63, avg=0.62, std=0.00, steps=4.019e+08
2023-07-07 07:56:05,868 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 11000, best=0.63, avg=0.62, std=0.00, steps=4.055e+08
2023-07-07 07:56:39,100 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 11100, best=0.63, avg=0.62, std=0.00, steps=4.092e+08
2023-07-07 07:57:12,361 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 11200, best=0.63, avg=0.62, std=0.00, steps=4.129e+08
2023-07-07 07:57:45,494 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 11300, best=0.63, avg=0.62, std=0.00, steps=4.166e+08
2023-07-07 07:58:18,873 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 11400, best=0.63, avg=0.62, std=0.00, steps=4.203e+08
2023-07-07 07:58:52,273 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 11500, best=0.63, avg=0.62, std=0.00, steps=4.240e+08
2023-07-07 07:59:25,586 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 11600, best=0.63, avg=0.62, std=0.00, steps=4.277e+08
2023-07-07 07:59:58,965 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 11700, best=0.63, avg=0.62, std=0.00, steps=4.313e+08
2023-07-07 08:00:32,074 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 11800, best=0.63, avg=0.63, std=0.00, steps=4.350e+08
2023-07-07 08:01:05,217 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 11900, best=0.63, avg=0.63, std=0.00, steps=4.387e+08
2023-07-07 08:01:37,991 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 16, 0, [Train]: 11999, best=0.63, avg=0.63, std=0.00, steps=4.424e+08
2023-07-07 08:01:37,991 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 08:01:38,016 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 08:01:38,047 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 08:02:17,298 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 100, best=0.51, avg=0.50, std=0.00, steps=4.137e+06
2023-07-07 08:02:54,048 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 200, best=0.51, avg=0.50, std=0.00, steps=8.233e+06
2023-07-07 08:03:30,968 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 300, best=0.51, avg=0.50, std=0.00, steps=1.233e+07
2023-07-07 08:04:08,155 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 400, best=0.51, avg=0.50, std=0.00, steps=1.642e+07
2023-07-07 08:04:45,192 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 500, best=0.51, avg=0.50, std=0.00, steps=2.052e+07
2023-07-07 08:05:22,041 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 600, best=0.51, avg=0.50, std=0.00, steps=2.462e+07
2023-07-07 08:05:58,922 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 700, best=0.51, avg=0.50, std=0.00, steps=2.871e+07
2023-07-07 08:06:35,950 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 800, best=0.51, avg=0.50, std=0.00, steps=3.281e+07
2023-07-07 08:07:12,688 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 900, best=0.51, avg=0.50, std=0.00, steps=3.690e+07
2023-07-07 08:07:49,394 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 1000, best=0.51, avg=0.50, std=0.00, steps=4.100e+07
2023-07-07 08:08:26,239 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 1100, best=0.51, avg=0.50, std=0.00, steps=4.510e+07
2023-07-07 08:09:03,039 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 1200, best=0.51, avg=0.50, std=0.00, steps=4.919e+07
2023-07-07 08:09:39,845 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 1300, best=0.51, avg=0.50, std=0.00, steps=5.329e+07
2023-07-07 08:10:16,732 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 1400, best=0.51, avg=0.50, std=0.00, steps=5.738e+07
2023-07-07 08:10:53,525 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 1500, best=0.51, avg=0.50, std=0.00, steps=6.148e+07
2023-07-07 08:11:30,325 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 1600, best=0.51, avg=0.50, std=0.00, steps=6.558e+07
2023-07-07 08:12:07,106 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 1700, best=0.51, avg=0.50, std=0.00, steps=6.967e+07
2023-07-07 08:12:43,957 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 1800, best=0.51, avg=0.50, std=0.00, steps=7.377e+07
2023-07-07 08:13:20,730 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 1900, best=0.51, avg=0.50, std=0.00, steps=7.786e+07
2023-07-07 08:13:57,624 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 2000, best=0.51, avg=0.50, std=0.00, steps=8.196e+07
2023-07-07 08:14:34,643 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 2100, best=0.51, avg=0.50, std=0.00, steps=8.606e+07
2023-07-07 08:15:11,656 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 2200, best=0.51, avg=0.50, std=0.00, steps=9.015e+07
2023-07-07 08:15:48,643 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 2300, best=0.51, avg=0.50, std=0.00, steps=9.425e+07
2023-07-07 08:16:25,634 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 2400, best=0.51, avg=0.50, std=0.00, steps=9.834e+07
2023-07-07 08:17:02,674 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 2500, best=0.51, avg=0.50, std=0.00, steps=1.024e+08
2023-07-07 08:17:39,727 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 2600, best=0.51, avg=0.50, std=0.00, steps=1.065e+08
2023-07-07 08:18:16,835 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 2700, best=0.51, avg=0.50, std=0.00, steps=1.106e+08
2023-07-07 08:18:53,704 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 2800, best=0.51, avg=0.50, std=0.00, steps=1.147e+08
2023-07-07 08:19:30,701 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 2900, best=0.51, avg=0.50, std=0.00, steps=1.188e+08
2023-07-07 08:20:07,714 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 3000, best=0.51, avg=0.50, std=0.00, steps=1.229e+08
2023-07-07 08:20:44,755 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 3100, best=0.51, avg=0.50, std=0.00, steps=1.270e+08
2023-07-07 08:21:21,932 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 3200, best=0.50, avg=0.50, std=0.00, steps=1.311e+08
2023-07-07 08:21:58,848 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 3300, best=0.51, avg=0.50, std=0.00, steps=1.352e+08
2023-07-07 08:22:35,794 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 3400, best=0.51, avg=0.50, std=0.00, steps=1.393e+08
2023-07-07 08:23:12,933 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 3500, best=0.51, avg=0.50, std=0.00, steps=1.434e+08
2023-07-07 08:23:50,088 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 3600, best=0.51, avg=0.50, std=0.00, steps=1.475e+08
2023-07-07 08:24:27,254 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 3700, best=0.51, avg=0.50, std=0.00, steps=1.516e+08
2023-07-07 08:25:04,273 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 3800, best=0.51, avg=0.50, std=0.00, steps=1.557e+08
2023-07-07 08:25:41,368 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 3900, best=0.51, avg=0.50, std=0.00, steps=1.598e+08
2023-07-07 08:26:18,390 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 4000, best=0.51, avg=0.50, std=0.00, steps=1.639e+08
2023-07-07 08:26:55,528 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 4100, best=0.51, avg=0.50, std=0.00, steps=1.680e+08
2023-07-07 08:27:32,612 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 4200, best=0.51, avg=0.50, std=0.00, steps=1.721e+08
2023-07-07 08:28:09,701 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 4300, best=0.51, avg=0.50, std=0.00, steps=1.762e+08
2023-07-07 08:28:46,632 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 4400, best=0.51, avg=0.50, std=0.00, steps=1.803e+08
2023-07-07 08:29:23,632 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 4500, best=0.51, avg=0.50, std=0.00, steps=1.844e+08
2023-07-07 08:30:00,650 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 4600, best=0.51, avg=0.50, std=0.00, steps=1.885e+08
2023-07-07 08:30:37,726 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 4700, best=0.51, avg=0.50, std=0.00, steps=1.926e+08
2023-07-07 08:31:14,717 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 4800, best=0.51, avg=0.50, std=0.00, steps=1.966e+08
2023-07-07 08:31:51,666 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 4900, best=0.51, avg=0.50, std=0.00, steps=2.007e+08
2023-07-07 08:32:28,731 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 5000, best=0.51, avg=0.50, std=0.00, steps=2.048e+08
2023-07-07 08:33:05,674 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 5100, best=0.51, avg=0.50, std=0.00, steps=2.089e+08
2023-07-07 08:33:42,683 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 5200, best=0.51, avg=0.50, std=0.00, steps=2.130e+08
2023-07-07 08:34:19,642 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 5300, best=0.51, avg=0.50, std=0.00, steps=2.171e+08
2023-07-07 08:34:56,735 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 5400, best=0.51, avg=0.50, std=0.00, steps=2.212e+08
2023-07-07 08:35:33,764 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 5500, best=0.55, avg=0.55, std=0.00, steps=2.253e+08
2023-07-07 08:36:11,044 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 5600, best=0.55, avg=0.55, std=0.00, steps=2.294e+08
2023-07-07 08:36:48,002 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 5700, best=0.55, avg=0.55, std=0.00, steps=2.335e+08
2023-07-07 08:37:25,005 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 5800, best=0.55, avg=0.55, std=0.00, steps=2.376e+08
2023-07-07 08:38:01,998 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 5900, best=0.55, avg=0.55, std=0.00, steps=2.417e+08
2023-07-07 08:38:39,190 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 6000, best=0.55, avg=0.55, std=0.00, steps=2.458e+08
2023-07-07 08:39:16,230 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 6100, best=0.55, avg=0.55, std=0.00, steps=2.499e+08
2023-07-07 08:39:53,339 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 6200, best=0.55, avg=0.55, std=0.00, steps=2.540e+08
2023-07-07 08:40:30,509 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 6300, best=0.55, avg=0.55, std=0.00, steps=2.581e+08
2023-07-07 08:41:07,575 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 6400, best=0.55, avg=0.55, std=0.00, steps=2.622e+08
2023-07-07 08:41:44,750 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 6500, best=0.55, avg=0.55, std=0.00, steps=2.663e+08
2023-07-07 08:42:21,921 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 6600, best=0.55, avg=0.55, std=0.00, steps=2.704e+08
2023-07-07 08:42:59,069 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 6700, best=0.55, avg=0.55, std=0.00, steps=2.745e+08
2023-07-07 08:43:36,250 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 6800, best=0.55, avg=0.55, std=0.00, steps=2.786e+08
2023-07-07 08:44:13,369 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 6900, best=0.55, avg=0.55, std=0.00, steps=2.827e+08
2023-07-07 08:44:50,590 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 7000, best=0.55, avg=0.55, std=0.00, steps=2.868e+08
2023-07-07 08:45:27,805 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 7100, best=0.56, avg=0.55, std=0.00, steps=2.909e+08
2023-07-07 08:46:05,004 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 7200, best=0.55, avg=0.55, std=0.00, steps=2.950e+08
2023-07-07 08:46:42,135 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 7300, best=0.55, avg=0.55, std=0.00, steps=2.990e+08
2023-07-07 08:47:19,253 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 7400, best=0.55, avg=0.55, std=0.00, steps=3.031e+08
2023-07-07 08:47:56,440 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 7500, best=0.55, avg=0.55, std=0.00, steps=3.072e+08
2023-07-07 08:48:33,565 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 7600, best=0.55, avg=0.55, std=0.00, steps=3.113e+08
2023-07-07 08:49:10,869 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 7700, best=0.55, avg=0.55, std=0.00, steps=3.154e+08
2023-07-07 08:49:47,974 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 7800, best=0.56, avg=0.55, std=0.00, steps=3.195e+08
2023-07-07 08:50:25,110 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 7900, best=0.55, avg=0.55, std=0.00, steps=3.236e+08
2023-07-07 08:51:02,345 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 8000, best=0.55, avg=0.55, std=0.00, steps=3.277e+08
2023-07-07 08:51:39,467 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 8100, best=0.55, avg=0.55, std=0.00, steps=3.318e+08
2023-07-07 08:52:16,687 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 8200, best=0.55, avg=0.55, std=0.00, steps=3.359e+08
2023-07-07 08:52:53,911 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 8300, best=0.55, avg=0.55, std=0.00, steps=3.400e+08
2023-07-07 08:53:31,046 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 8400, best=0.55, avg=0.55, std=0.00, steps=3.441e+08
2023-07-07 08:54:08,245 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 8500, best=0.55, avg=0.55, std=0.00, steps=3.482e+08
2023-07-07 08:54:45,384 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 8600, best=0.55, avg=0.55, std=0.00, steps=3.523e+08
2023-07-07 08:55:22,619 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 8700, best=0.55, avg=0.55, std=0.00, steps=3.564e+08
2023-07-07 08:55:59,777 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 8800, best=0.55, avg=0.55, std=0.00, steps=3.605e+08
2023-07-07 08:56:36,881 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 8900, best=0.56, avg=0.55, std=0.00, steps=3.646e+08
2023-07-07 08:57:14,344 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 9000, best=0.55, avg=0.55, std=0.00, steps=3.687e+08
2023-07-07 08:57:51,555 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 9100, best=0.55, avg=0.55, std=0.00, steps=3.728e+08
2023-07-07 08:58:28,809 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 9200, best=0.55, avg=0.55, std=0.00, steps=3.769e+08
2023-07-07 08:59:05,947 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 9300, best=0.55, avg=0.55, std=0.00, steps=3.810e+08
2023-07-07 08:59:43,106 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 9400, best=0.55, avg=0.55, std=0.00, steps=3.851e+08
2023-07-07 09:00:20,318 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 9500, best=0.55, avg=0.55, std=0.00, steps=3.892e+08
2023-07-07 09:00:57,414 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 9600, best=0.55, avg=0.55, std=0.00, steps=3.933e+08
2023-07-07 09:01:34,755 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 9700, best=0.55, avg=0.55, std=0.00, steps=3.974e+08
2023-07-07 09:02:11,908 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 9800, best=0.55, avg=0.55, std=0.00, steps=4.014e+08
2023-07-07 09:02:49,084 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 9900, best=0.55, avg=0.55, std=0.00, steps=4.055e+08
2023-07-07 09:03:26,338 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 10000, best=0.55, avg=0.55, std=0.00, steps=4.096e+08
2023-07-07 09:04:03,792 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 10100, best=0.55, avg=0.55, std=0.00, steps=4.137e+08
2023-07-07 09:04:40,870 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 10200, best=0.55, avg=0.55, std=0.00, steps=4.178e+08
2023-07-07 09:05:18,025 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 10300, best=0.56, avg=0.55, std=0.00, steps=4.219e+08
2023-07-07 09:05:55,331 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 10400, best=0.55, avg=0.55, std=0.00, steps=4.260e+08
2023-07-07 09:06:32,367 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 10500, best=0.55, avg=0.55, std=0.00, steps=4.301e+08
2023-07-07 09:07:09,427 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 10600, best=0.55, avg=0.55, std=0.00, steps=4.342e+08
2023-07-07 09:07:46,548 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 10700, best=0.55, avg=0.55, std=0.00, steps=4.383e+08
2023-07-07 09:08:23,776 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 10800, best=0.55, avg=0.55, std=0.00, steps=4.424e+08
2023-07-07 09:09:00,900 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 10900, best=0.55, avg=0.55, std=0.00, steps=4.465e+08
2023-07-07 09:09:38,040 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 11000, best=0.56, avg=0.55, std=0.00, steps=4.506e+08
2023-07-07 09:10:15,300 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 11100, best=0.55, avg=0.55, std=0.00, steps=4.547e+08
2023-07-07 09:10:52,415 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 11200, best=0.56, avg=0.55, std=0.00, steps=4.588e+08
2023-07-07 09:11:29,546 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 11300, best=0.56, avg=0.56, std=0.00, steps=4.629e+08
2023-07-07 09:12:06,783 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 11400, best=0.57, avg=0.56, std=0.00, steps=4.670e+08
2023-07-07 09:12:44,176 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 11500, best=0.57, avg=0.56, std=0.00, steps=4.711e+08
2023-07-07 09:13:21,290 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 11600, best=0.57, avg=0.56, std=0.00, steps=4.752e+08
2023-07-07 09:13:58,496 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 11700, best=0.57, avg=0.57, std=0.00, steps=4.793e+08
2023-07-07 09:14:35,689 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 11800, best=0.57, avg=0.57, std=0.00, steps=4.834e+08
2023-07-07 09:15:12,924 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 11900, best=0.57, avg=0.57, std=0.00, steps=4.875e+08
2023-07-07 09:15:49,734 -        meta learning: [    INFO] - [Len Lat Rep]: 64, 32, 0, [Train]: 11999, best=0.57, avg=0.57, std=0.00, steps=4.915e+08
2023-07-07 09:15:49,735 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 09:15:49,758 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 09:15:49,790 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 09:15:55,628 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 100, best=0.73, avg=0.71, std=0.01, steps=4.137e+05
2023-07-07 09:15:59,595 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 200, best=0.79, avg=0.78, std=0.01, steps=8.233e+05
2023-07-07 09:16:03,577 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 300, best=0.88, avg=0.86, std=0.01, steps=1.233e+06
2023-07-07 09:16:07,564 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 400, best=0.92, avg=0.90, std=0.01, steps=1.642e+06
2023-07-07 09:16:11,558 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 500, best=0.96, avg=0.95, std=0.00, steps=2.052e+06
2023-07-07 09:16:15,560 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 600, best=0.98, avg=0.97, std=0.00, steps=2.462e+06
2023-07-07 09:16:19,562 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 700, best=1.00, avg=0.99, std=0.00, steps=2.871e+06
2023-07-07 09:16:23,550 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 800, best=1.00, avg=1.00, std=0.00, steps=3.281e+06
2023-07-07 09:16:27,535 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 900, best=1.00, avg=1.00, std=0.00, steps=3.690e+06
2023-07-07 09:16:31,501 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 1000, best=1.00, avg=1.00, std=0.00, steps=4.100e+06
2023-07-07 09:16:35,469 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 1100, best=1.00, avg=1.00, std=0.00, steps=4.510e+06
2023-07-07 09:16:39,452 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 1200, best=1.00, avg=1.00, std=0.00, steps=4.919e+06
2023-07-07 09:16:43,430 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 1300, best=1.00, avg=1.00, std=0.00, steps=5.329e+06
2023-07-07 09:16:47,441 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 1400, best=1.00, avg=1.00, std=0.00, steps=5.738e+06
2023-07-07 09:16:51,437 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 1500, best=1.00, avg=1.00, std=0.00, steps=6.148e+06
2023-07-07 09:16:55,408 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 1600, best=1.00, avg=1.00, std=0.00, steps=6.558e+06
2023-07-07 09:16:59,377 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 1700, best=1.00, avg=1.00, std=0.00, steps=6.967e+06
2023-07-07 09:17:03,345 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 1800, best=1.00, avg=1.00, std=0.00, steps=7.377e+06
2023-07-07 09:17:07,325 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 1900, best=1.00, avg=1.00, std=0.00, steps=7.786e+06
2023-07-07 09:17:11,315 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 2000, best=1.00, avg=1.00, std=0.00, steps=8.196e+06
2023-07-07 09:17:15,296 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 2100, best=1.00, avg=1.00, std=0.00, steps=8.606e+06
2023-07-07 09:17:19,299 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 2200, best=1.00, avg=1.00, std=0.00, steps=9.015e+06
2023-07-07 09:17:23,294 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 2300, best=1.00, avg=1.00, std=0.00, steps=9.425e+06
2023-07-07 09:17:27,284 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 2400, best=1.00, avg=1.00, std=0.00, steps=9.834e+06
2023-07-07 09:17:31,287 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 2500, best=1.00, avg=1.00, std=0.00, steps=1.024e+07
2023-07-07 09:17:35,292 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 2600, best=1.00, avg=1.00, std=0.00, steps=1.065e+07
2023-07-07 09:17:39,278 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 2700, best=1.00, avg=1.00, std=0.00, steps=1.106e+07
2023-07-07 09:17:43,271 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 2800, best=1.00, avg=1.00, std=0.00, steps=1.147e+07
2023-07-07 09:17:47,268 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 2900, best=1.00, avg=1.00, std=0.00, steps=1.188e+07
2023-07-07 09:17:51,257 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 3000, best=1.00, avg=1.00, std=0.00, steps=1.229e+07
2023-07-07 09:17:55,264 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 3100, best=1.00, avg=1.00, std=0.00, steps=1.270e+07
2023-07-07 09:17:59,264 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 3200, best=1.00, avg=1.00, std=0.00, steps=1.311e+07
2023-07-07 09:18:03,266 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 3300, best=1.00, avg=1.00, std=0.00, steps=1.352e+07
2023-07-07 09:18:07,267 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 3400, best=1.00, avg=1.00, std=0.00, steps=1.393e+07
2023-07-07 09:18:11,261 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 3500, best=1.00, avg=1.00, std=0.00, steps=1.434e+07
2023-07-07 09:18:15,239 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 3600, best=1.00, avg=1.00, std=0.00, steps=1.475e+07
2023-07-07 09:18:19,234 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 3700, best=1.00, avg=1.00, std=0.00, steps=1.516e+07
2023-07-07 09:18:23,228 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 3800, best=1.00, avg=1.00, std=0.00, steps=1.557e+07
2023-07-07 09:18:27,216 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 3900, best=1.00, avg=1.00, std=0.00, steps=1.598e+07
2023-07-07 09:18:31,198 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 4000, best=1.00, avg=1.00, std=0.00, steps=1.639e+07
2023-07-07 09:18:35,184 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 4100, best=1.00, avg=1.00, std=0.00, steps=1.680e+07
2023-07-07 09:18:39,165 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 4200, best=1.00, avg=1.00, std=0.00, steps=1.721e+07
2023-07-07 09:18:43,138 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 4300, best=1.00, avg=1.00, std=0.00, steps=1.762e+07
2023-07-07 09:18:47,121 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 4400, best=1.00, avg=1.00, std=0.00, steps=1.803e+07
2023-07-07 09:18:51,106 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 4500, best=1.00, avg=1.00, std=0.00, steps=1.844e+07
2023-07-07 09:18:55,083 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 4600, best=1.00, avg=1.00, std=0.00, steps=1.885e+07
2023-07-07 09:18:59,068 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 4700, best=1.00, avg=1.00, std=0.00, steps=1.926e+07
2023-07-07 09:19:03,042 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 4800, best=1.00, avg=1.00, std=0.00, steps=1.966e+07
2023-07-07 09:19:07,025 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 4900, best=1.00, avg=1.00, std=0.00, steps=2.007e+07
2023-07-07 09:19:11,008 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 5000, best=1.00, avg=1.00, std=0.00, steps=2.048e+07
2023-07-07 09:19:14,972 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 5100, best=1.00, avg=1.00, std=0.00, steps=2.089e+07
2023-07-07 09:19:18,926 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 5200, best=1.00, avg=1.00, std=0.00, steps=2.130e+07
2023-07-07 09:19:22,893 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 5300, best=1.00, avg=1.00, std=0.00, steps=2.171e+07
2023-07-07 09:19:26,883 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 5400, best=1.00, avg=1.00, std=0.00, steps=2.212e+07
2023-07-07 09:19:30,849 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 5500, best=1.00, avg=1.00, std=0.00, steps=2.253e+07
2023-07-07 09:19:34,801 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 5600, best=1.00, avg=1.00, std=0.00, steps=2.294e+07
2023-07-07 09:19:38,779 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 5700, best=1.00, avg=1.00, std=0.00, steps=2.335e+07
2023-07-07 09:19:42,758 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 5800, best=1.00, avg=1.00, std=0.00, steps=2.376e+07
2023-07-07 09:19:46,760 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 5900, best=1.00, avg=1.00, std=0.00, steps=2.417e+07
2023-07-07 09:19:50,744 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 6000, best=1.00, avg=1.00, std=0.00, steps=2.458e+07
2023-07-07 09:19:54,724 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 6100, best=1.00, avg=1.00, std=0.00, steps=2.499e+07
2023-07-07 09:19:58,703 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 6200, best=1.00, avg=1.00, std=0.00, steps=2.540e+07
2023-07-07 09:20:02,678 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 6300, best=1.00, avg=1.00, std=0.00, steps=2.581e+07
2023-07-07 09:20:06,648 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 6400, best=1.00, avg=1.00, std=0.00, steps=2.622e+07
2023-07-07 09:20:10,634 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 6500, best=1.00, avg=1.00, std=0.00, steps=2.663e+07
2023-07-07 09:20:14,617 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 6600, best=1.00, avg=1.00, std=0.00, steps=2.704e+07
2023-07-07 09:20:18,588 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 6700, best=1.00, avg=1.00, std=0.00, steps=2.745e+07
2023-07-07 09:20:22,568 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 6800, best=1.00, avg=1.00, std=0.00, steps=2.786e+07
2023-07-07 09:20:26,535 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 6900, best=1.00, avg=1.00, std=0.00, steps=2.827e+07
2023-07-07 09:20:30,486 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 7000, best=1.00, avg=1.00, std=0.00, steps=2.868e+07
2023-07-07 09:20:34,458 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 7100, best=1.00, avg=1.00, std=0.00, steps=2.909e+07
2023-07-07 09:20:38,443 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 7200, best=1.00, avg=1.00, std=0.00, steps=2.950e+07
2023-07-07 09:20:42,419 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 7300, best=1.00, avg=1.00, std=0.00, steps=2.990e+07
2023-07-07 09:20:46,382 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 7400, best=1.00, avg=1.00, std=0.00, steps=3.031e+07
2023-07-07 09:20:50,348 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 7500, best=1.00, avg=1.00, std=0.00, steps=3.072e+07
2023-07-07 09:20:54,298 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 7600, best=1.00, avg=1.00, std=0.00, steps=3.113e+07
2023-07-07 09:20:58,265 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 7700, best=1.00, avg=1.00, std=0.00, steps=3.154e+07
2023-07-07 09:21:02,253 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 7800, best=1.00, avg=1.00, std=0.00, steps=3.195e+07
2023-07-07 09:21:06,238 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 7900, best=1.00, avg=1.00, std=0.00, steps=3.236e+07
2023-07-07 09:21:10,213 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 8000, best=1.00, avg=1.00, std=0.00, steps=3.277e+07
2023-07-07 09:21:14,172 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 8100, best=1.00, avg=1.00, std=0.00, steps=3.318e+07
2023-07-07 09:21:18,137 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 8200, best=1.00, avg=1.00, std=0.00, steps=3.359e+07
2023-07-07 09:21:22,122 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 8300, best=1.00, avg=1.00, std=0.00, steps=3.400e+07
2023-07-07 09:21:26,107 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 8400, best=1.00, avg=1.00, std=0.00, steps=3.441e+07
2023-07-07 09:21:30,096 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 8500, best=1.00, avg=1.00, std=0.00, steps=3.482e+07
2023-07-07 09:21:34,069 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 8600, best=1.00, avg=1.00, std=0.00, steps=3.523e+07
2023-07-07 09:21:38,046 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 8700, best=1.00, avg=1.00, std=0.00, steps=3.564e+07
2023-07-07 09:21:42,046 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 8800, best=1.00, avg=1.00, std=0.00, steps=3.605e+07
2023-07-07 09:21:46,033 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 8900, best=1.00, avg=1.00, std=0.00, steps=3.646e+07
2023-07-07 09:21:50,028 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 9000, best=1.00, avg=1.00, std=0.00, steps=3.687e+07
2023-07-07 09:21:54,011 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 9100, best=1.00, avg=1.00, std=0.00, steps=3.728e+07
2023-07-07 09:21:57,998 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 9200, best=1.00, avg=1.00, std=0.00, steps=3.769e+07
2023-07-07 09:22:02,008 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 9300, best=1.00, avg=1.00, std=0.00, steps=3.810e+07
2023-07-07 09:22:05,995 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 9400, best=1.00, avg=1.00, std=0.00, steps=3.851e+07
2023-07-07 09:22:10,008 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 9500, best=1.00, avg=1.00, std=0.00, steps=3.892e+07
2023-07-07 09:22:14,005 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 9600, best=1.00, avg=1.00, std=0.00, steps=3.933e+07
2023-07-07 09:22:17,991 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 9700, best=1.00, avg=1.00, std=0.00, steps=3.974e+07
2023-07-07 09:22:22,005 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 9800, best=1.00, avg=1.00, std=0.00, steps=4.014e+07
2023-07-07 09:22:25,988 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 9900, best=1.00, avg=1.00, std=0.00, steps=4.055e+07
2023-07-07 09:22:29,982 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 10000, best=1.00, avg=1.00, std=0.00, steps=4.096e+07
2023-07-07 09:22:33,964 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 10100, best=1.00, avg=1.00, std=0.00, steps=4.137e+07
2023-07-07 09:22:37,948 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 10200, best=1.00, avg=1.00, std=0.00, steps=4.178e+07
2023-07-07 09:22:41,926 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 10300, best=1.00, avg=1.00, std=0.00, steps=4.219e+07
2023-07-07 09:22:45,906 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 10400, best=1.00, avg=1.00, std=0.00, steps=4.260e+07
2023-07-07 09:22:49,893 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 10500, best=1.00, avg=1.00, std=0.00, steps=4.301e+07
2023-07-07 09:22:53,869 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 10600, best=1.00, avg=1.00, std=0.00, steps=4.342e+07
2023-07-07 09:22:57,852 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 10700, best=1.00, avg=1.00, std=0.00, steps=4.383e+07
2023-07-07 09:23:01,836 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 10800, best=1.00, avg=1.00, std=0.00, steps=4.424e+07
2023-07-07 09:23:05,827 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 10900, best=1.00, avg=1.00, std=0.00, steps=4.465e+07
2023-07-07 09:23:09,818 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 11000, best=1.00, avg=1.00, std=0.00, steps=4.506e+07
2023-07-07 09:23:13,821 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 11100, best=1.00, avg=1.00, std=0.00, steps=4.547e+07
2023-07-07 09:23:17,813 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 11200, best=1.00, avg=1.00, std=0.00, steps=4.588e+07
2023-07-07 09:23:21,808 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 11300, best=1.00, avg=1.00, std=0.00, steps=4.629e+07
2023-07-07 09:23:25,767 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 11400, best=1.00, avg=1.00, std=0.00, steps=4.670e+07
2023-07-07 09:23:29,751 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 11500, best=1.00, avg=1.00, std=0.00, steps=4.711e+07
2023-07-07 09:23:33,738 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 11600, best=1.00, avg=1.00, std=0.00, steps=4.752e+07
2023-07-07 09:23:37,717 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 11700, best=1.00, avg=1.00, std=0.00, steps=4.793e+07
2023-07-07 09:23:41,715 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 11800, best=1.00, avg=1.00, std=0.00, steps=4.834e+07
2023-07-07 09:23:45,717 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 11900, best=1.00, avg=1.00, std=0.00, steps=4.875e+07
2023-07-07 09:23:49,664 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 0, 1, [Train]: 11999, best=1.00, avg=1.00, std=0.00, steps=4.915e+07
2023-07-07 09:23:49,665 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 09:23:49,688 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 09:23:49,720 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 09:23:57,277 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 100, best=0.52, avg=0.50, std=0.01, steps=6.205e+05
2023-07-07 09:24:03,088 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 200, best=0.70, avg=0.69, std=0.01, steps=1.235e+06
2023-07-07 09:24:08,899 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 300, best=0.74, avg=0.72, std=0.01, steps=1.849e+06
2023-07-07 09:24:14,705 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 400, best=0.76, avg=0.75, std=0.01, steps=2.464e+06
2023-07-07 09:24:20,517 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 500, best=0.78, avg=0.77, std=0.01, steps=3.078e+06
2023-07-07 09:24:26,347 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 600, best=0.80, avg=0.79, std=0.01, steps=3.693e+06
2023-07-07 09:24:32,175 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 700, best=0.82, avg=0.81, std=0.01, steps=4.307e+06
2023-07-07 09:24:38,001 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 800, best=0.84, avg=0.82, std=0.01, steps=4.921e+06
2023-07-07 09:24:43,826 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 900, best=0.84, avg=0.83, std=0.01, steps=5.536e+06
2023-07-07 09:24:49,668 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 1000, best=0.85, avg=0.84, std=0.01, steps=6.150e+06
2023-07-07 09:24:55,514 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 1100, best=0.86, avg=0.85, std=0.01, steps=6.765e+06
2023-07-07 09:25:01,356 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 1200, best=0.87, avg=0.86, std=0.00, steps=7.379e+06
2023-07-07 09:25:07,178 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 1300, best=0.88, avg=0.87, std=0.00, steps=7.993e+06
2023-07-07 09:25:13,017 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 1400, best=0.89, avg=0.87, std=0.00, steps=8.608e+06
2023-07-07 09:25:18,840 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 1500, best=0.89, avg=0.88, std=0.00, steps=9.222e+06
2023-07-07 09:25:24,648 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 1600, best=0.89, avg=0.88, std=0.00, steps=9.837e+06
2023-07-07 09:25:30,487 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 1700, best=0.89, avg=0.88, std=0.00, steps=1.045e+07
2023-07-07 09:25:36,311 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 1800, best=0.89, avg=0.88, std=0.00, steps=1.107e+07
2023-07-07 09:25:42,136 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 1900, best=0.90, avg=0.89, std=0.00, steps=1.168e+07
2023-07-07 09:25:47,952 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 2000, best=0.90, avg=0.89, std=0.00, steps=1.229e+07
2023-07-07 09:25:53,743 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 2100, best=0.90, avg=0.89, std=0.00, steps=1.291e+07
2023-07-07 09:25:59,578 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 2200, best=0.90, avg=0.89, std=0.00, steps=1.352e+07
2023-07-07 09:26:05,423 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 2300, best=0.90, avg=0.89, std=0.00, steps=1.414e+07
2023-07-07 09:26:11,234 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 2400, best=0.90, avg=0.89, std=0.00, steps=1.475e+07
2023-07-07 09:26:17,038 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 2500, best=0.90, avg=0.89, std=0.00, steps=1.537e+07
2023-07-07 09:26:22,852 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 2600, best=0.90, avg=0.90, std=0.00, steps=1.598e+07
2023-07-07 09:26:28,667 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 2700, best=0.90, avg=0.90, std=0.00, steps=1.659e+07
2023-07-07 09:26:34,464 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 2800, best=0.90, avg=0.90, std=0.00, steps=1.721e+07
2023-07-07 09:26:40,286 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 2900, best=0.91, avg=0.90, std=0.00, steps=1.782e+07
2023-07-07 09:26:46,116 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 3000, best=0.91, avg=0.90, std=0.00, steps=1.844e+07
2023-07-07 09:26:51,945 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 3100, best=0.91, avg=0.90, std=0.00, steps=1.905e+07
2023-07-07 09:26:57,774 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 3200, best=0.91, avg=0.90, std=0.00, steps=1.967e+07
2023-07-07 09:27:03,594 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 3300, best=0.91, avg=0.90, std=0.00, steps=2.028e+07
2023-07-07 09:27:09,434 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 3400, best=0.91, avg=0.90, std=0.00, steps=2.090e+07
2023-07-07 09:27:15,222 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 3500, best=0.91, avg=0.90, std=0.00, steps=2.151e+07
2023-07-07 09:27:21,034 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 3600, best=0.91, avg=0.90, std=0.00, steps=2.212e+07
2023-07-07 09:27:26,826 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 3700, best=0.91, avg=0.90, std=0.00, steps=2.274e+07
2023-07-07 09:27:32,620 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 3800, best=0.91, avg=0.90, std=0.00, steps=2.335e+07
2023-07-07 09:27:38,431 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 3900, best=0.91, avg=0.90, std=0.00, steps=2.397e+07
2023-07-07 09:27:44,261 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 4000, best=0.91, avg=0.90, std=0.00, steps=2.458e+07
2023-07-07 09:27:50,086 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 4100, best=0.91, avg=0.90, std=0.00, steps=2.520e+07
2023-07-07 09:27:55,916 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 4200, best=0.91, avg=0.90, std=0.00, steps=2.581e+07
2023-07-07 09:28:01,753 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 4300, best=0.91, avg=0.90, std=0.00, steps=2.643e+07
2023-07-07 09:28:07,598 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 4400, best=0.91, avg=0.90, std=0.00, steps=2.704e+07
2023-07-07 09:28:13,384 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 4500, best=0.91, avg=0.90, std=0.00, steps=2.765e+07
2023-07-07 09:28:19,194 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 4600, best=0.91, avg=0.90, std=0.00, steps=2.827e+07
2023-07-07 09:28:25,025 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 4700, best=0.91, avg=0.90, std=0.00, steps=2.888e+07
2023-07-07 09:28:30,847 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 4800, best=0.91, avg=0.90, std=0.00, steps=2.950e+07
2023-07-07 09:28:36,661 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 4900, best=0.91, avg=0.90, std=0.00, steps=3.011e+07
2023-07-07 09:28:42,481 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 5000, best=0.91, avg=0.90, std=0.00, steps=3.073e+07
2023-07-07 09:28:48,323 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 5100, best=0.91, avg=0.90, std=0.00, steps=3.134e+07
2023-07-07 09:28:54,153 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 5200, best=0.91, avg=0.90, std=0.00, steps=3.195e+07
2023-07-07 09:28:59,989 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 5300, best=0.91, avg=0.90, std=0.00, steps=3.257e+07
2023-07-07 09:29:05,829 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 5400, best=0.92, avg=0.91, std=0.00, steps=3.318e+07
2023-07-07 09:29:11,665 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 5500, best=0.91, avg=0.91, std=0.00, steps=3.380e+07
2023-07-07 09:29:17,499 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 5600, best=0.91, avg=0.90, std=0.00, steps=3.441e+07
2023-07-07 09:29:23,324 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 5700, best=0.92, avg=0.90, std=0.00, steps=3.503e+07
2023-07-07 09:29:29,141 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 5800, best=0.91, avg=0.90, std=0.00, steps=3.564e+07
2023-07-07 09:29:34,963 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 5900, best=0.92, avg=0.90, std=0.00, steps=3.626e+07
2023-07-07 09:29:40,769 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 6000, best=0.91, avg=0.91, std=0.00, steps=3.687e+07
2023-07-07 09:29:46,598 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 6100, best=0.91, avg=0.91, std=0.00, steps=3.748e+07
2023-07-07 09:29:52,404 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 6200, best=0.91, avg=0.90, std=0.00, steps=3.810e+07
2023-07-07 09:29:58,186 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 6300, best=0.92, avg=0.91, std=0.00, steps=3.871e+07
2023-07-07 09:30:03,992 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 6400, best=0.92, avg=0.91, std=0.00, steps=3.933e+07
2023-07-07 09:30:09,808 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 6500, best=0.92, avg=0.91, std=0.00, steps=3.994e+07
2023-07-07 09:30:15,619 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 6600, best=0.92, avg=0.91, std=0.00, steps=4.056e+07
2023-07-07 09:30:21,442 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 6700, best=0.92, avg=0.91, std=0.00, steps=4.117e+07
2023-07-07 09:30:27,275 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 6800, best=0.92, avg=0.91, std=0.00, steps=4.179e+07
2023-07-07 09:30:33,093 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 6900, best=0.92, avg=0.91, std=0.00, steps=4.240e+07
2023-07-07 09:30:38,890 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 7000, best=0.93, avg=0.91, std=0.00, steps=4.301e+07
2023-07-07 09:30:44,710 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 7100, best=0.92, avg=0.92, std=0.00, steps=4.363e+07
2023-07-07 09:30:50,514 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 7200, best=0.93, avg=0.92, std=0.00, steps=4.424e+07
2023-07-07 09:30:56,304 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 7300, best=0.92, avg=0.92, std=0.00, steps=4.486e+07
2023-07-07 09:31:02,112 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 7400, best=0.93, avg=0.92, std=0.00, steps=4.547e+07
2023-07-07 09:31:07,952 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 7500, best=0.93, avg=0.92, std=0.00, steps=4.609e+07
2023-07-07 09:31:13,786 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 7600, best=0.93, avg=0.92, std=0.00, steps=4.670e+07
2023-07-07 09:31:19,592 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 7700, best=0.93, avg=0.92, std=0.00, steps=4.731e+07
2023-07-07 09:31:25,416 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 7800, best=0.93, avg=0.92, std=0.00, steps=4.793e+07
2023-07-07 09:31:31,239 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 7900, best=0.93, avg=0.92, std=0.00, steps=4.854e+07
2023-07-07 09:31:37,068 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 8000, best=0.93, avg=0.92, std=0.00, steps=4.916e+07
2023-07-07 09:31:42,899 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 8100, best=0.92, avg=0.92, std=0.00, steps=4.977e+07
2023-07-07 09:31:48,730 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 8200, best=0.92, avg=0.92, std=0.00, steps=5.039e+07
2023-07-07 09:31:54,563 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 8300, best=0.92, avg=0.92, std=0.00, steps=5.100e+07
2023-07-07 09:32:00,388 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 8400, best=0.92, avg=0.92, std=0.00, steps=5.162e+07
2023-07-07 09:32:06,203 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 8500, best=0.92, avg=0.92, std=0.00, steps=5.223e+07
2023-07-07 09:32:12,015 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 8600, best=0.93, avg=0.92, std=0.00, steps=5.284e+07
2023-07-07 09:32:17,853 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 8700, best=0.93, avg=0.92, std=0.00, steps=5.346e+07
2023-07-07 09:32:23,662 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 8800, best=0.92, avg=0.92, std=0.00, steps=5.407e+07
2023-07-07 09:32:29,461 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 8900, best=0.92, avg=0.91, std=0.00, steps=5.469e+07
2023-07-07 09:32:35,263 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 9000, best=0.93, avg=0.92, std=0.00, steps=5.530e+07
2023-07-07 09:32:41,068 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 9100, best=0.93, avg=0.92, std=0.00, steps=5.592e+07
2023-07-07 09:32:46,880 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 9200, best=0.92, avg=0.92, std=0.00, steps=5.653e+07
2023-07-07 09:32:52,697 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 9300, best=0.93, avg=0.92, std=0.00, steps=5.715e+07
2023-07-07 09:32:58,506 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 9400, best=0.93, avg=0.92, std=0.00, steps=5.776e+07
2023-07-07 09:33:04,319 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 9500, best=0.93, avg=0.92, std=0.00, steps=5.837e+07
2023-07-07 09:33:10,141 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 9600, best=0.93, avg=0.92, std=0.00, steps=5.899e+07
2023-07-07 09:33:15,973 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 9700, best=0.92, avg=0.92, std=0.00, steps=5.960e+07
2023-07-07 09:33:21,791 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 9800, best=0.93, avg=0.91, std=0.00, steps=6.022e+07
2023-07-07 09:33:27,599 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 9900, best=0.93, avg=0.92, std=0.00, steps=6.083e+07
2023-07-07 09:33:33,423 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 10000, best=0.93, avg=0.92, std=0.00, steps=6.145e+07
2023-07-07 09:33:39,244 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 10100, best=0.93, avg=0.92, std=0.00, steps=6.206e+07
2023-07-07 09:33:45,048 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 10200, best=0.93, avg=0.92, std=0.00, steps=6.267e+07
2023-07-07 09:33:50,834 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 10300, best=0.93, avg=0.92, std=0.00, steps=6.329e+07
2023-07-07 09:33:56,639 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 10400, best=0.93, avg=0.92, std=0.00, steps=6.390e+07
2023-07-07 09:34:02,458 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 10500, best=0.92, avg=0.92, std=0.00, steps=6.452e+07
2023-07-07 09:34:08,278 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 10600, best=0.93, avg=0.92, std=0.00, steps=6.513e+07
2023-07-07 09:34:14,091 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 10700, best=0.92, avg=0.92, std=0.00, steps=6.575e+07
2023-07-07 09:34:19,889 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 10800, best=0.93, avg=0.92, std=0.00, steps=6.636e+07
2023-07-07 09:34:25,713 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 10900, best=0.92, avg=0.92, std=0.00, steps=6.698e+07
2023-07-07 09:34:31,529 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 11000, best=0.92, avg=0.92, std=0.00, steps=6.759e+07
2023-07-07 09:34:37,340 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 11100, best=0.93, avg=0.92, std=0.00, steps=6.820e+07
2023-07-07 09:34:43,164 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 11200, best=0.93, avg=0.92, std=0.00, steps=6.882e+07
2023-07-07 09:34:48,977 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 11300, best=0.92, avg=0.92, std=0.00, steps=6.943e+07
2023-07-07 09:34:54,788 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 11400, best=0.93, avg=0.92, std=0.00, steps=7.005e+07
2023-07-07 09:35:00,587 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 11500, best=0.93, avg=0.92, std=0.00, steps=7.066e+07
2023-07-07 09:35:06,387 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 11600, best=0.93, avg=0.92, std=0.00, steps=7.128e+07
2023-07-07 09:35:12,181 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 11700, best=0.93, avg=0.92, std=0.00, steps=7.189e+07
2023-07-07 09:35:18,009 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 11800, best=0.93, avg=0.92, std=0.00, steps=7.251e+07
2023-07-07 09:35:23,836 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 11900, best=0.92, avg=0.92, std=0.00, steps=7.312e+07
2023-07-07 09:35:29,617 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 8, 1, [Train]: 11999, best=0.92, avg=0.92, std=0.00, steps=7.373e+07
2023-07-07 09:35:29,617 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 09:35:29,641 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 09:35:29,671 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 09:35:39,240 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 100, best=0.52, avg=0.50, std=0.01, steps=8.274e+05
2023-07-07 09:35:46,909 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 200, best=0.68, avg=0.66, std=0.01, steps=1.647e+06
2023-07-07 09:35:54,541 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 300, best=0.72, avg=0.70, std=0.01, steps=2.466e+06
2023-07-07 09:36:02,195 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 400, best=0.73, avg=0.71, std=0.01, steps=3.285e+06
2023-07-07 09:36:09,823 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 500, best=0.74, avg=0.73, std=0.01, steps=4.104e+06
2023-07-07 09:36:17,455 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 600, best=0.76, avg=0.74, std=0.01, steps=4.923e+06
2023-07-07 09:36:25,115 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 700, best=0.77, avg=0.76, std=0.01, steps=5.743e+06
2023-07-07 09:36:32,744 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 800, best=0.79, avg=0.77, std=0.01, steps=6.562e+06
2023-07-07 09:36:40,380 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 900, best=0.79, avg=0.77, std=0.01, steps=7.381e+06
2023-07-07 09:36:48,004 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 1000, best=0.80, avg=0.78, std=0.01, steps=8.200e+06
2023-07-07 09:36:55,581 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 1100, best=0.80, avg=0.79, std=0.01, steps=9.019e+06
2023-07-07 09:37:03,193 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 1200, best=0.81, avg=0.80, std=0.01, steps=9.839e+06
2023-07-07 09:37:10,797 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 1300, best=0.82, avg=0.80, std=0.00, steps=1.066e+07
2023-07-07 09:37:18,412 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 1400, best=0.83, avg=0.81, std=0.01, steps=1.148e+07
2023-07-07 09:37:26,045 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 1500, best=0.84, avg=0.82, std=0.00, steps=1.230e+07
2023-07-07 09:37:33,656 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 1600, best=0.84, avg=0.83, std=0.00, steps=1.312e+07
2023-07-07 09:37:41,275 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 1700, best=0.85, avg=0.83, std=0.01, steps=1.393e+07
2023-07-07 09:37:48,900 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 1800, best=0.85, avg=0.83, std=0.01, steps=1.475e+07
2023-07-07 09:37:56,563 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 1900, best=0.85, avg=0.84, std=0.00, steps=1.557e+07
2023-07-07 09:38:04,210 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 2000, best=0.85, avg=0.84, std=0.00, steps=1.639e+07
2023-07-07 09:38:11,868 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 2100, best=0.85, avg=0.84, std=0.00, steps=1.721e+07
2023-07-07 09:38:19,543 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 2200, best=0.85, avg=0.84, std=0.00, steps=1.803e+07
2023-07-07 09:38:27,206 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 2300, best=0.85, avg=0.84, std=0.01, steps=1.885e+07
2023-07-07 09:38:34,860 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 2400, best=0.86, avg=0.84, std=0.01, steps=1.967e+07
2023-07-07 09:38:42,525 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 2500, best=0.85, avg=0.85, std=0.00, steps=2.049e+07
2023-07-07 09:38:50,179 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 2600, best=0.86, avg=0.85, std=0.00, steps=2.131e+07
2023-07-07 09:38:57,821 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 2700, best=0.86, avg=0.85, std=0.00, steps=2.213e+07
2023-07-07 09:39:05,464 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 2800, best=0.86, avg=0.85, std=0.00, steps=2.295e+07
2023-07-07 09:39:13,114 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 2900, best=0.86, avg=0.85, std=0.00, steps=2.376e+07
2023-07-07 09:39:20,801 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 3000, best=0.87, avg=0.85, std=0.00, steps=2.458e+07
2023-07-07 09:39:28,478 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 3100, best=0.86, avg=0.85, std=0.00, steps=2.540e+07
2023-07-07 09:39:36,089 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 3200, best=0.86, avg=0.85, std=0.00, steps=2.622e+07
2023-07-07 09:39:43,743 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 3300, best=0.87, avg=0.86, std=0.00, steps=2.704e+07
2023-07-07 09:39:51,383 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 3400, best=0.87, avg=0.86, std=0.00, steps=2.786e+07
2023-07-07 09:39:59,013 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 3500, best=0.87, avg=0.86, std=0.00, steps=2.868e+07
2023-07-07 09:40:06,648 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 3600, best=0.87, avg=0.86, std=0.00, steps=2.950e+07
2023-07-07 09:40:14,269 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 3700, best=0.87, avg=0.86, std=0.00, steps=3.032e+07
2023-07-07 09:40:21,914 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 3800, best=0.87, avg=0.86, std=0.00, steps=3.114e+07
2023-07-07 09:40:29,568 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 3900, best=0.87, avg=0.86, std=0.00, steps=3.196e+07
2023-07-07 09:40:37,209 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 4000, best=0.87, avg=0.86, std=0.00, steps=3.278e+07
2023-07-07 09:40:44,843 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 4100, best=0.88, avg=0.87, std=0.00, steps=3.360e+07
2023-07-07 09:40:52,460 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 4200, best=0.88, avg=0.87, std=0.00, steps=3.441e+07
2023-07-07 09:41:00,118 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 4300, best=0.88, avg=0.87, std=0.00, steps=3.523e+07
2023-07-07 09:41:07,777 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 4400, best=0.88, avg=0.87, std=0.00, steps=3.605e+07
2023-07-07 09:41:15,418 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 4500, best=0.89, avg=0.88, std=0.00, steps=3.687e+07
2023-07-07 09:41:23,092 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 4600, best=0.89, avg=0.88, std=0.00, steps=3.769e+07
2023-07-07 09:41:30,728 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 4700, best=0.89, avg=0.88, std=0.00, steps=3.851e+07
2023-07-07 09:41:38,380 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 4800, best=0.89, avg=0.88, std=0.00, steps=3.933e+07
2023-07-07 09:41:46,046 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 4900, best=0.89, avg=0.88, std=0.00, steps=4.015e+07
2023-07-07 09:41:53,704 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 5000, best=0.89, avg=0.88, std=0.00, steps=4.097e+07
2023-07-07 09:42:01,379 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 5100, best=0.89, avg=0.88, std=0.00, steps=4.179e+07
2023-07-07 09:42:09,035 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 5200, best=0.89, avg=0.88, std=0.00, steps=4.261e+07
2023-07-07 09:42:16,678 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 5300, best=0.89, avg=0.88, std=0.00, steps=4.343e+07
2023-07-07 09:42:24,292 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 5400, best=0.89, avg=0.88, std=0.00, steps=4.424e+07
2023-07-07 09:42:31,915 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 5500, best=0.89, avg=0.88, std=0.00, steps=4.506e+07
2023-07-07 09:42:39,562 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 5600, best=0.89, avg=0.88, std=0.00, steps=4.588e+07
2023-07-07 09:42:47,219 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 5700, best=0.89, avg=0.88, std=0.00, steps=4.670e+07
2023-07-07 09:42:54,865 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 5800, best=0.89, avg=0.88, std=0.00, steps=4.752e+07
2023-07-07 09:43:02,498 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 5900, best=0.89, avg=0.88, std=0.00, steps=4.834e+07
2023-07-07 09:43:10,096 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 6000, best=0.89, avg=0.88, std=0.00, steps=4.916e+07
2023-07-07 09:43:17,719 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 6100, best=0.89, avg=0.88, std=0.00, steps=4.998e+07
2023-07-07 09:43:25,343 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 6200, best=0.89, avg=0.88, std=0.00, steps=5.080e+07
2023-07-07 09:43:32,977 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 6300, best=0.89, avg=0.88, std=0.00, steps=5.162e+07
2023-07-07 09:43:40,614 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 6400, best=0.89, avg=0.88, std=0.00, steps=5.244e+07
2023-07-07 09:43:48,257 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 6500, best=0.89, avg=0.88, std=0.00, steps=5.326e+07
2023-07-07 09:43:55,894 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 6600, best=0.89, avg=0.88, std=0.00, steps=5.408e+07
2023-07-07 09:44:03,533 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 6700, best=0.89, avg=0.88, std=0.00, steps=5.489e+07
2023-07-07 09:44:11,157 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 6800, best=0.89, avg=0.88, std=0.00, steps=5.571e+07
2023-07-07 09:44:18,773 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 6900, best=0.89, avg=0.88, std=0.00, steps=5.653e+07
2023-07-07 09:44:26,392 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 7000, best=0.89, avg=0.88, std=0.00, steps=5.735e+07
2023-07-07 09:44:34,007 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 7100, best=0.89, avg=0.88, std=0.00, steps=5.817e+07
2023-07-07 09:44:41,627 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 7200, best=0.89, avg=0.88, std=0.00, steps=5.899e+07
2023-07-07 09:44:49,247 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 7300, best=0.89, avg=0.88, std=0.00, steps=5.981e+07
2023-07-07 09:44:56,861 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 7400, best=0.89, avg=0.88, std=0.00, steps=6.063e+07
2023-07-07 09:45:04,511 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 7500, best=0.89, avg=0.88, std=0.00, steps=6.145e+07
2023-07-07 09:45:12,195 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 7600, best=0.89, avg=0.88, std=0.00, steps=6.227e+07
2023-07-07 09:45:19,824 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 7700, best=0.89, avg=0.88, std=0.00, steps=6.309e+07
2023-07-07 09:45:27,476 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 7800, best=0.89, avg=0.88, std=0.00, steps=6.391e+07
2023-07-07 09:45:35,127 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 7900, best=0.89, avg=0.88, std=0.00, steps=6.472e+07
2023-07-07 09:45:42,781 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 8000, best=0.89, avg=0.88, std=0.00, steps=6.554e+07
2023-07-07 09:45:50,424 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 8100, best=0.89, avg=0.88, std=0.00, steps=6.636e+07
2023-07-07 09:45:58,119 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 8200, best=0.90, avg=0.88, std=0.00, steps=6.718e+07
2023-07-07 09:46:05,796 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 8300, best=0.90, avg=0.88, std=0.00, steps=6.800e+07
2023-07-07 09:46:13,453 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 8400, best=0.89, avg=0.88, std=0.00, steps=6.882e+07
2023-07-07 09:46:21,107 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 8500, best=0.89, avg=0.88, std=0.00, steps=6.964e+07
2023-07-07 09:46:28,766 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 8600, best=0.89, avg=0.88, std=0.00, steps=7.046e+07
2023-07-07 09:46:36,423 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 8700, best=0.89, avg=0.88, std=0.00, steps=7.128e+07
2023-07-07 09:46:44,069 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 8800, best=0.89, avg=0.88, std=0.00, steps=7.210e+07
2023-07-07 09:46:51,706 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 8900, best=0.89, avg=0.88, std=0.00, steps=7.292e+07
2023-07-07 09:46:59,338 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 9000, best=0.89, avg=0.88, std=0.00, steps=7.374e+07
2023-07-07 09:47:06,958 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 9100, best=0.89, avg=0.88, std=0.00, steps=7.456e+07
2023-07-07 09:47:14,580 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 9200, best=0.89, avg=0.88, std=0.00, steps=7.537e+07
2023-07-07 09:47:22,196 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 9300, best=0.89, avg=0.88, std=0.00, steps=7.619e+07
2023-07-07 09:47:29,859 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 9400, best=0.89, avg=0.88, std=0.00, steps=7.701e+07
2023-07-07 09:47:37,512 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 9500, best=0.89, avg=0.88, std=0.00, steps=7.783e+07
2023-07-07 09:47:45,171 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 9600, best=0.89, avg=0.88, std=0.00, steps=7.865e+07
2023-07-07 09:47:52,823 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 9700, best=0.89, avg=0.88, std=0.00, steps=7.947e+07
2023-07-07 09:48:00,483 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 9800, best=0.89, avg=0.88, std=0.00, steps=8.029e+07
2023-07-07 09:48:08,124 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 9900, best=0.90, avg=0.88, std=0.00, steps=8.111e+07
2023-07-07 09:48:15,752 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 10000, best=0.89, avg=0.88, std=0.00, steps=8.193e+07
2023-07-07 09:48:23,395 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 10100, best=0.89, avg=0.88, std=0.00, steps=8.275e+07
2023-07-07 09:48:31,062 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 10200, best=0.89, avg=0.88, std=0.00, steps=8.357e+07
2023-07-07 09:48:38,702 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 10300, best=0.89, avg=0.88, std=0.00, steps=8.439e+07
2023-07-07 09:48:46,328 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 10400, best=0.89, avg=0.88, std=0.00, steps=8.520e+07
2023-07-07 09:48:53,928 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 10500, best=0.89, avg=0.88, std=0.00, steps=8.602e+07
2023-07-07 09:49:01,556 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 10600, best=0.89, avg=0.88, std=0.00, steps=8.684e+07
2023-07-07 09:49:09,193 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 10700, best=0.89, avg=0.88, std=0.00, steps=8.766e+07
2023-07-07 09:49:16,828 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 10800, best=0.89, avg=0.88, std=0.00, steps=8.848e+07
2023-07-07 09:49:24,458 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 10900, best=0.89, avg=0.88, std=0.00, steps=8.930e+07
2023-07-07 09:49:32,081 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 11000, best=0.89, avg=0.88, std=0.00, steps=9.012e+07
2023-07-07 09:49:39,709 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 11100, best=0.89, avg=0.88, std=0.00, steps=9.094e+07
2023-07-07 09:49:47,368 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 11200, best=0.89, avg=0.88, std=0.00, steps=9.176e+07
2023-07-07 09:49:55,021 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 11300, best=0.89, avg=0.88, std=0.00, steps=9.258e+07
2023-07-07 09:50:02,667 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 11400, best=0.89, avg=0.88, std=0.00, steps=9.340e+07
2023-07-07 09:50:10,322 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 11500, best=0.89, avg=0.88, std=0.00, steps=9.422e+07
2023-07-07 09:50:17,946 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 11600, best=0.89, avg=0.88, std=0.00, steps=9.504e+07
2023-07-07 09:50:25,584 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 11700, best=0.89, avg=0.88, std=0.00, steps=9.585e+07
2023-07-07 09:50:33,202 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 11800, best=0.89, avg=0.88, std=0.00, steps=9.667e+07
2023-07-07 09:50:40,847 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 11900, best=0.89, avg=0.88, std=0.00, steps=9.749e+07
2023-07-07 09:50:48,378 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 16, 1, [Train]: 11999, best=0.89, avg=0.88, std=0.00, steps=9.830e+07
2023-07-07 09:50:48,378 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 09:50:48,401 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 09:50:48,432 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 09:51:01,648 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 100, best=0.52, avg=0.50, std=0.01, steps=1.241e+06
2023-07-07 09:51:12,923 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 200, best=0.52, avg=0.50, std=0.01, steps=2.470e+06
2023-07-07 09:51:24,221 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 300, best=0.52, avg=0.50, std=0.01, steps=3.699e+06
2023-07-07 09:51:35,559 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 400, best=0.52, avg=0.50, std=0.01, steps=4.927e+06
2023-07-07 09:51:46,915 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 500, best=0.52, avg=0.50, std=0.01, steps=6.156e+06
2023-07-07 09:51:58,219 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 600, best=0.52, avg=0.50, std=0.01, steps=7.385e+06
2023-07-07 09:52:09,507 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 700, best=0.52, avg=0.50, std=0.01, steps=8.614e+06
2023-07-07 09:52:20,806 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 800, best=0.52, avg=0.50, std=0.01, steps=9.843e+06
2023-07-07 09:52:32,146 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 900, best=0.52, avg=0.50, std=0.01, steps=1.107e+07
2023-07-07 09:52:43,407 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 1000, best=0.52, avg=0.50, std=0.01, steps=1.230e+07
2023-07-07 09:52:54,699 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 1100, best=0.52, avg=0.50, std=0.01, steps=1.353e+07
2023-07-07 09:53:05,972 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 1200, best=0.52, avg=0.50, std=0.01, steps=1.476e+07
2023-07-07 09:53:17,304 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 1300, best=0.52, avg=0.50, std=0.01, steps=1.599e+07
2023-07-07 09:53:28,636 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 1400, best=0.51, avg=0.50, std=0.01, steps=1.722e+07
2023-07-07 09:53:39,975 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 1500, best=0.52, avg=0.50, std=0.01, steps=1.844e+07
2023-07-07 09:53:51,275 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 1600, best=0.52, avg=0.50, std=0.01, steps=1.967e+07
2023-07-07 09:54:02,583 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 1700, best=0.52, avg=0.50, std=0.01, steps=2.090e+07
2023-07-07 09:54:13,899 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 1800, best=0.52, avg=0.50, std=0.01, steps=2.213e+07
2023-07-07 09:54:25,191 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 1900, best=0.52, avg=0.50, std=0.01, steps=2.336e+07
2023-07-07 09:54:36,496 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 2000, best=0.52, avg=0.50, std=0.01, steps=2.459e+07
2023-07-07 09:54:47,841 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 2100, best=0.52, avg=0.50, std=0.01, steps=2.582e+07
2023-07-07 09:54:59,185 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 2200, best=0.53, avg=0.50, std=0.01, steps=2.705e+07
2023-07-07 09:55:10,488 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 2300, best=0.52, avg=0.50, std=0.01, steps=2.827e+07
2023-07-07 09:55:21,786 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 2400, best=0.52, avg=0.50, std=0.01, steps=2.950e+07
2023-07-07 09:55:33,070 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 2500, best=0.53, avg=0.50, std=0.01, steps=3.073e+07
2023-07-07 09:55:44,396 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 2600, best=0.52, avg=0.50, std=0.01, steps=3.196e+07
2023-07-07 09:55:55,724 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 2700, best=0.52, avg=0.50, std=0.01, steps=3.319e+07
2023-07-07 09:56:07,061 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 2800, best=0.52, avg=0.50, std=0.01, steps=3.442e+07
2023-07-07 09:56:18,419 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 2900, best=0.52, avg=0.50, std=0.01, steps=3.565e+07
2023-07-07 09:56:29,751 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 3000, best=0.52, avg=0.50, std=0.01, steps=3.688e+07
2023-07-07 09:56:41,045 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 3100, best=0.52, avg=0.50, std=0.01, steps=3.811e+07
2023-07-07 09:56:52,330 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 3200, best=0.52, avg=0.50, std=0.01, steps=3.933e+07
2023-07-07 09:57:03,657 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 3300, best=0.53, avg=0.50, std=0.01, steps=4.056e+07
2023-07-07 09:57:15,072 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 3400, best=0.52, avg=0.50, std=0.01, steps=4.179e+07
2023-07-07 09:57:26,390 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 3500, best=0.52, avg=0.50, std=0.01, steps=4.302e+07
2023-07-07 09:57:37,703 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 3600, best=0.52, avg=0.50, std=0.01, steps=4.425e+07
2023-07-07 09:57:48,985 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 3700, best=0.52, avg=0.50, std=0.01, steps=4.548e+07
2023-07-07 09:58:00,260 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 3800, best=0.52, avg=0.50, std=0.01, steps=4.671e+07
2023-07-07 09:58:11,588 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 3900, best=0.53, avg=0.50, std=0.01, steps=4.794e+07
2023-07-07 09:58:22,941 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 4000, best=0.52, avg=0.50, std=0.01, steps=4.916e+07
2023-07-07 09:58:34,276 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 4100, best=0.52, avg=0.50, std=0.01, steps=5.039e+07
2023-07-07 09:58:45,619 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 4200, best=0.52, avg=0.50, std=0.01, steps=5.162e+07
2023-07-07 09:58:56,939 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 4300, best=0.52, avg=0.50, std=0.01, steps=5.285e+07
2023-07-07 09:59:08,260 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 4400, best=0.52, avg=0.50, std=0.01, steps=5.408e+07
2023-07-07 09:59:19,537 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 4500, best=0.52, avg=0.50, std=0.01, steps=5.531e+07
2023-07-07 09:59:30,822 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 4600, best=0.52, avg=0.50, std=0.01, steps=5.654e+07
2023-07-07 09:59:42,134 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 4700, best=0.52, avg=0.50, std=0.01, steps=5.777e+07
2023-07-07 09:59:53,461 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 4800, best=0.52, avg=0.50, std=0.01, steps=5.899e+07
2023-07-07 10:00:04,798 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 4900, best=0.53, avg=0.50, std=0.01, steps=6.022e+07
2023-07-07 10:00:16,119 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 5000, best=0.52, avg=0.50, std=0.01, steps=6.145e+07
2023-07-07 10:00:27,425 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 5100, best=0.53, avg=0.50, std=0.01, steps=6.268e+07
2023-07-07 10:00:38,737 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 5200, best=0.51, avg=0.50, std=0.01, steps=6.391e+07
2023-07-07 10:00:50,051 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 5300, best=0.52, avg=0.50, std=0.01, steps=6.514e+07
2023-07-07 10:01:01,400 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 5400, best=0.52, avg=0.50, std=0.01, steps=6.637e+07
2023-07-07 10:01:12,718 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 5500, best=0.52, avg=0.50, std=0.01, steps=6.760e+07
2023-07-07 10:01:24,020 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 5600, best=0.52, avg=0.50, std=0.01, steps=6.883e+07
2023-07-07 10:01:35,289 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 5700, best=0.52, avg=0.50, std=0.01, steps=7.005e+07
2023-07-07 10:01:46,572 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 5800, best=0.52, avg=0.50, std=0.01, steps=7.128e+07
2023-07-07 10:01:57,899 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 5900, best=0.52, avg=0.50, std=0.01, steps=7.251e+07
2023-07-07 10:02:09,207 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 6000, best=0.52, avg=0.50, std=0.01, steps=7.374e+07
2023-07-07 10:02:20,491 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 6100, best=0.52, avg=0.50, std=0.01, steps=7.497e+07
2023-07-07 10:02:31,789 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 6200, best=0.52, avg=0.50, std=0.01, steps=7.620e+07
2023-07-07 10:02:43,107 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 6300, best=0.52, avg=0.50, std=0.01, steps=7.743e+07
2023-07-07 10:02:54,422 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 6400, best=0.52, avg=0.50, std=0.01, steps=7.866e+07
2023-07-07 10:03:05,807 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 6500, best=0.52, avg=0.50, std=0.01, steps=7.988e+07
2023-07-07 10:03:17,154 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 6600, best=0.52, avg=0.50, std=0.01, steps=8.111e+07
2023-07-07 10:03:28,464 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 6700, best=0.52, avg=0.50, std=0.01, steps=8.234e+07
2023-07-07 10:03:39,772 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 6800, best=0.52, avg=0.50, std=0.01, steps=8.357e+07
2023-07-07 10:03:51,051 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 6900, best=0.52, avg=0.50, std=0.01, steps=8.480e+07
2023-07-07 10:04:02,332 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 7000, best=0.53, avg=0.50, std=0.01, steps=8.603e+07
2023-07-07 10:04:13,612 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 7100, best=0.52, avg=0.50, std=0.01, steps=8.726e+07
2023-07-07 10:04:24,914 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 7200, best=0.52, avg=0.50, std=0.01, steps=8.849e+07
2023-07-07 10:04:36,243 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 7300, best=0.52, avg=0.50, std=0.01, steps=8.971e+07
2023-07-07 10:04:47,555 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 7400, best=0.52, avg=0.50, std=0.01, steps=9.094e+07
2023-07-07 10:04:58,859 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 7500, best=0.52, avg=0.50, std=0.01, steps=9.217e+07
2023-07-07 10:05:10,166 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 7600, best=0.52, avg=0.50, std=0.01, steps=9.340e+07
2023-07-07 10:05:21,506 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 7700, best=0.52, avg=0.50, std=0.01, steps=9.463e+07
2023-07-07 10:05:32,791 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 7800, best=0.52, avg=0.50, std=0.01, steps=9.586e+07
2023-07-07 10:05:44,100 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 7900, best=0.52, avg=0.50, std=0.01, steps=9.709e+07
2023-07-07 10:05:55,410 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 8000, best=0.51, avg=0.50, std=0.01, steps=9.832e+07
2023-07-07 10:06:06,721 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 8100, best=0.52, avg=0.50, std=0.01, steps=9.955e+07
2023-07-07 10:06:18,033 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 8200, best=0.52, avg=0.50, std=0.01, steps=1.008e+08
2023-07-07 10:06:29,324 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 8300, best=0.52, avg=0.50, std=0.01, steps=1.020e+08
2023-07-07 10:06:40,645 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 8400, best=0.52, avg=0.50, std=0.01, steps=1.032e+08
2023-07-07 10:06:51,963 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 8500, best=0.51, avg=0.50, std=0.01, steps=1.045e+08
2023-07-07 10:07:03,272 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 8600, best=0.52, avg=0.50, std=0.01, steps=1.057e+08
2023-07-07 10:07:14,617 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 8700, best=0.52, avg=0.50, std=0.01, steps=1.069e+08
2023-07-07 10:07:25,945 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 8800, best=0.52, avg=0.50, std=0.01, steps=1.081e+08
2023-07-07 10:07:37,276 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 8900, best=0.52, avg=0.50, std=0.01, steps=1.094e+08
2023-07-07 10:07:48,578 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 9000, best=0.52, avg=0.50, std=0.01, steps=1.106e+08
2023-07-07 10:07:59,887 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 9100, best=0.52, avg=0.50, std=0.01, steps=1.118e+08
2023-07-07 10:08:11,209 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 9200, best=0.52, avg=0.50, std=0.01, steps=1.131e+08
2023-07-07 10:08:22,515 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 9300, best=0.52, avg=0.50, std=0.01, steps=1.143e+08
2023-07-07 10:08:33,825 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 9400, best=0.53, avg=0.50, std=0.01, steps=1.155e+08
2023-07-07 10:08:45,116 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 9500, best=0.52, avg=0.50, std=0.01, steps=1.167e+08
2023-07-07 10:08:56,423 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 9600, best=0.65, avg=0.64, std=0.01, steps=1.180e+08
2023-07-07 10:09:07,727 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 9700, best=0.68, avg=0.66, std=0.00, steps=1.192e+08
2023-07-07 10:09:19,034 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 9800, best=0.70, avg=0.68, std=0.01, steps=1.204e+08
2023-07-07 10:09:30,340 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 9900, best=0.72, avg=0.70, std=0.01, steps=1.217e+08
2023-07-07 10:09:41,714 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 10000, best=0.72, avg=0.70, std=0.01, steps=1.229e+08
2023-07-07 10:09:53,058 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 10100, best=0.72, avg=0.71, std=0.01, steps=1.241e+08
2023-07-07 10:10:04,404 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 10200, best=0.73, avg=0.71, std=0.01, steps=1.253e+08
2023-07-07 10:10:15,764 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 10300, best=0.73, avg=0.72, std=0.01, steps=1.266e+08
2023-07-07 10:10:27,113 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 10400, best=0.73, avg=0.72, std=0.00, steps=1.278e+08
2023-07-07 10:10:38,448 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 10500, best=0.74, avg=0.72, std=0.01, steps=1.290e+08
2023-07-07 10:10:49,782 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 10600, best=0.74, avg=0.73, std=0.01, steps=1.303e+08
2023-07-07 10:11:01,082 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 10700, best=0.74, avg=0.73, std=0.01, steps=1.315e+08
2023-07-07 10:11:12,404 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 10800, best=0.74, avg=0.73, std=0.01, steps=1.327e+08
2023-07-07 10:11:23,690 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 10900, best=0.75, avg=0.73, std=0.01, steps=1.340e+08
2023-07-07 10:11:34,965 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 11000, best=0.75, avg=0.73, std=0.01, steps=1.352e+08
2023-07-07 10:11:46,256 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 11100, best=0.75, avg=0.73, std=0.01, steps=1.364e+08
2023-07-07 10:11:57,558 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 11200, best=0.76, avg=0.74, std=0.01, steps=1.376e+08
2023-07-07 10:12:08,885 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 11300, best=0.76, avg=0.75, std=0.01, steps=1.389e+08
2023-07-07 10:12:20,229 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 11400, best=0.76, avg=0.74, std=0.01, steps=1.401e+08
2023-07-07 10:12:31,550 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 11500, best=0.76, avg=0.75, std=0.01, steps=1.413e+08
2023-07-07 10:12:42,869 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 11600, best=0.76, avg=0.75, std=0.01, steps=1.426e+08
2023-07-07 10:12:54,157 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 11700, best=0.77, avg=0.75, std=0.01, steps=1.438e+08
2023-07-07 10:13:05,450 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 11800, best=0.77, avg=0.75, std=0.01, steps=1.450e+08
2023-07-07 10:13:16,762 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 11900, best=0.76, avg=0.75, std=0.01, steps=1.462e+08
2023-07-07 10:13:27,978 -        meta learning: [    INFO] - [Len Lat Rep]: 8, 32, 1, [Train]: 11999, best=0.77, avg=0.76, std=0.01, steps=1.475e+08
2023-07-07 10:13:27,979 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 10:13:28,003 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 10:13:28,033 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 10:13:37,573 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 100, best=0.64, avg=0.63, std=0.00, steps=8.274e+05
2023-07-07 10:13:45,200 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 200, best=0.71, avg=0.70, std=0.00, steps=1.647e+06
2023-07-07 10:13:52,829 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 300, best=0.76, avg=0.75, std=0.00, steps=2.466e+06
2023-07-07 10:14:00,466 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 400, best=0.78, avg=0.77, std=0.00, steps=3.285e+06
2023-07-07 10:14:08,080 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 500, best=0.79, avg=0.78, std=0.00, steps=4.104e+06
2023-07-07 10:14:15,701 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 600, best=0.80, avg=0.79, std=0.00, steps=4.923e+06
2023-07-07 10:14:23,317 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 700, best=0.82, avg=0.81, std=0.00, steps=5.743e+06
2023-07-07 10:14:30,942 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 800, best=0.83, avg=0.82, std=0.00, steps=6.562e+06
2023-07-07 10:14:38,600 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 900, best=0.85, avg=0.83, std=0.00, steps=7.381e+06
2023-07-07 10:14:46,312 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 1000, best=0.86, avg=0.85, std=0.00, steps=8.200e+06
2023-07-07 10:14:53,956 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 1100, best=0.86, avg=0.85, std=0.00, steps=9.019e+06
2023-07-07 10:15:01,573 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 1200, best=0.87, avg=0.86, std=0.00, steps=9.839e+06
2023-07-07 10:15:09,228 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 1300, best=0.87, avg=0.87, std=0.00, steps=1.066e+07
2023-07-07 10:15:16,847 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 1400, best=0.88, avg=0.87, std=0.00, steps=1.148e+07
2023-07-07 10:15:24,505 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 1500, best=0.88, avg=0.88, std=0.00, steps=1.230e+07
2023-07-07 10:15:32,137 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 1600, best=0.89, avg=0.88, std=0.00, steps=1.312e+07
2023-07-07 10:15:39,759 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 1700, best=0.89, avg=0.88, std=0.00, steps=1.393e+07
2023-07-07 10:15:47,389 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 1800, best=0.89, avg=0.88, std=0.00, steps=1.475e+07
2023-07-07 10:15:55,024 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 1900, best=0.89, avg=0.89, std=0.00, steps=1.557e+07
2023-07-07 10:16:02,656 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 2000, best=0.90, avg=0.89, std=0.00, steps=1.639e+07
2023-07-07 10:16:10,264 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 2100, best=0.90, avg=0.89, std=0.00, steps=1.721e+07
2023-07-07 10:16:17,883 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 2200, best=0.90, avg=0.89, std=0.00, steps=1.803e+07
2023-07-07 10:16:25,506 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 2300, best=0.90, avg=0.89, std=0.00, steps=1.885e+07
2023-07-07 10:16:33,168 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 2400, best=0.90, avg=0.90, std=0.00, steps=1.967e+07
2023-07-07 10:16:40,841 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 2500, best=0.90, avg=0.90, std=0.00, steps=2.049e+07
2023-07-07 10:16:48,504 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 2600, best=0.91, avg=0.90, std=0.00, steps=2.131e+07
2023-07-07 10:16:56,163 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 2700, best=0.91, avg=0.90, std=0.00, steps=2.213e+07
2023-07-07 10:17:03,787 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 2800, best=0.91, avg=0.90, std=0.00, steps=2.295e+07
2023-07-07 10:17:11,400 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 2900, best=0.91, avg=0.90, std=0.00, steps=2.376e+07
2023-07-07 10:17:19,026 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 3000, best=0.91, avg=0.90, std=0.00, steps=2.458e+07
2023-07-07 10:17:26,666 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 3100, best=0.91, avg=0.90, std=0.00, steps=2.540e+07
2023-07-07 10:17:34,307 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 3200, best=0.91, avg=0.90, std=0.00, steps=2.622e+07
2023-07-07 10:17:41,951 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 3300, best=0.91, avg=0.90, std=0.00, steps=2.704e+07
2023-07-07 10:17:49,612 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 3400, best=0.91, avg=0.90, std=0.00, steps=2.786e+07
2023-07-07 10:17:57,364 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 3500, best=0.91, avg=0.90, std=0.00, steps=2.868e+07
2023-07-07 10:18:05,002 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 3600, best=0.91, avg=0.90, std=0.00, steps=2.950e+07
2023-07-07 10:18:12,624 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 3700, best=0.91, avg=0.91, std=0.00, steps=3.032e+07
2023-07-07 10:18:20,272 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 3800, best=0.91, avg=0.91, std=0.00, steps=3.114e+07
2023-07-07 10:18:27,914 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 3900, best=0.91, avg=0.91, std=0.00, steps=3.196e+07
2023-07-07 10:18:35,516 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 4000, best=0.91, avg=0.91, std=0.00, steps=3.278e+07
2023-07-07 10:18:43,117 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 4100, best=0.91, avg=0.91, std=0.00, steps=3.360e+07
2023-07-07 10:18:50,767 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 4200, best=0.91, avg=0.91, std=0.00, steps=3.441e+07
2023-07-07 10:18:58,407 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 4300, best=0.92, avg=0.91, std=0.00, steps=3.523e+07
2023-07-07 10:19:06,030 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 4400, best=0.91, avg=0.91, std=0.00, steps=3.605e+07
2023-07-07 10:19:13,665 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 4500, best=0.92, avg=0.91, std=0.00, steps=3.687e+07
2023-07-07 10:19:21,310 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 4600, best=0.91, avg=0.91, std=0.00, steps=3.769e+07
2023-07-07 10:19:28,930 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 4700, best=0.92, avg=0.91, std=0.00, steps=3.851e+07
2023-07-07 10:19:36,581 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 4800, best=0.92, avg=0.91, std=0.00, steps=3.933e+07
2023-07-07 10:19:44,224 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 4900, best=0.91, avg=0.91, std=0.00, steps=4.015e+07
2023-07-07 10:19:51,851 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 5000, best=0.92, avg=0.91, std=0.00, steps=4.097e+07
2023-07-07 10:19:59,485 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 5100, best=0.91, avg=0.91, std=0.00, steps=4.179e+07
2023-07-07 10:20:07,231 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 5200, best=0.92, avg=0.91, std=0.00, steps=4.261e+07
2023-07-07 10:20:14,873 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 5300, best=0.92, avg=0.91, std=0.00, steps=4.343e+07
2023-07-07 10:20:22,516 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 5400, best=0.92, avg=0.91, std=0.00, steps=4.424e+07
2023-07-07 10:20:30,151 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 5500, best=0.92, avg=0.91, std=0.00, steps=4.506e+07
2023-07-07 10:20:37,767 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 5600, best=0.92, avg=0.91, std=0.00, steps=4.588e+07
2023-07-07 10:20:45,385 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 5700, best=0.92, avg=0.91, std=0.00, steps=4.670e+07
2023-07-07 10:20:53,027 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 5800, best=0.92, avg=0.91, std=0.00, steps=4.752e+07
2023-07-07 10:21:00,676 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 5900, best=0.92, avg=0.91, std=0.00, steps=4.834e+07
2023-07-07 10:21:08,298 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 6000, best=0.92, avg=0.91, std=0.00, steps=4.916e+07
2023-07-07 10:21:15,946 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 6100, best=0.92, avg=0.91, std=0.00, steps=4.998e+07
2023-07-07 10:21:23,601 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 6200, best=0.92, avg=0.91, std=0.00, steps=5.080e+07
2023-07-07 10:21:31,254 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 6300, best=0.92, avg=0.91, std=0.00, steps=5.162e+07
2023-07-07 10:21:38,884 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 6400, best=0.92, avg=0.91, std=0.00, steps=5.244e+07
2023-07-07 10:21:46,529 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 6500, best=0.92, avg=0.91, std=0.00, steps=5.326e+07
2023-07-07 10:21:54,168 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 6600, best=0.92, avg=0.91, std=0.00, steps=5.408e+07
2023-07-07 10:22:01,799 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 6700, best=0.92, avg=0.91, std=0.00, steps=5.489e+07
2023-07-07 10:22:09,433 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 6800, best=0.92, avg=0.91, std=0.00, steps=5.571e+07
2023-07-07 10:22:17,137 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 6900, best=0.92, avg=0.91, std=0.00, steps=5.653e+07
2023-07-07 10:22:24,867 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 7000, best=0.92, avg=0.91, std=0.00, steps=5.735e+07
2023-07-07 10:22:32,503 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 7100, best=0.92, avg=0.91, std=0.00, steps=5.817e+07
2023-07-07 10:22:40,149 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 7200, best=0.92, avg=0.91, std=0.00, steps=5.899e+07
2023-07-07 10:22:47,803 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 7300, best=0.92, avg=0.91, std=0.00, steps=5.981e+07
2023-07-07 10:22:55,445 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 7400, best=0.92, avg=0.91, std=0.00, steps=6.063e+07
2023-07-07 10:23:03,073 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 7500, best=0.92, avg=0.91, std=0.00, steps=6.145e+07
2023-07-07 10:23:10,710 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 7600, best=0.92, avg=0.91, std=0.00, steps=6.227e+07
2023-07-07 10:23:18,363 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 7700, best=0.92, avg=0.91, std=0.00, steps=6.309e+07
2023-07-07 10:23:26,006 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 7800, best=0.92, avg=0.91, std=0.00, steps=6.391e+07
2023-07-07 10:23:33,659 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 7900, best=0.92, avg=0.91, std=0.00, steps=6.472e+07
2023-07-07 10:23:41,282 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 8000, best=0.92, avg=0.91, std=0.00, steps=6.554e+07
2023-07-07 10:23:48,875 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 8100, best=0.92, avg=0.91, std=0.00, steps=6.636e+07
2023-07-07 10:23:56,530 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 8200, best=0.92, avg=0.91, std=0.00, steps=6.718e+07
2023-07-07 10:24:04,176 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 8300, best=0.92, avg=0.91, std=0.00, steps=6.800e+07
2023-07-07 10:24:11,825 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 8400, best=0.92, avg=0.91, std=0.00, steps=6.882e+07
2023-07-07 10:24:19,467 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 8500, best=0.92, avg=0.91, std=0.00, steps=6.964e+07
2023-07-07 10:24:27,117 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 8600, best=0.92, avg=0.91, std=0.00, steps=7.046e+07
2023-07-07 10:24:34,775 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 8700, best=0.92, avg=0.91, std=0.00, steps=7.128e+07
2023-07-07 10:24:42,428 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 8800, best=0.92, avg=0.91, std=0.00, steps=7.210e+07
2023-07-07 10:24:50,146 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 8900, best=0.92, avg=0.91, std=0.00, steps=7.292e+07
2023-07-07 10:24:57,815 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 9000, best=0.92, avg=0.91, std=0.00, steps=7.374e+07
2023-07-07 10:25:05,508 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 9100, best=0.92, avg=0.91, std=0.00, steps=7.456e+07
2023-07-07 10:25:13,142 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 9200, best=0.92, avg=0.92, std=0.00, steps=7.537e+07
2023-07-07 10:25:20,806 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 9300, best=0.92, avg=0.92, std=0.00, steps=7.619e+07
2023-07-07 10:25:28,474 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 9400, best=0.92, avg=0.92, std=0.00, steps=7.701e+07
2023-07-07 10:25:36,122 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 9500, best=0.92, avg=0.92, std=0.00, steps=7.783e+07
2023-07-07 10:25:43,774 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 9600, best=0.92, avg=0.92, std=0.00, steps=7.865e+07
2023-07-07 10:25:51,438 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 9700, best=0.93, avg=0.92, std=0.00, steps=7.947e+07
2023-07-07 10:25:59,094 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 9800, best=0.92, avg=0.92, std=0.00, steps=8.029e+07
2023-07-07 10:26:06,731 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 9900, best=0.93, avg=0.92, std=0.00, steps=8.111e+07
2023-07-07 10:26:14,400 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 10000, best=0.93, avg=0.92, std=0.00, steps=8.193e+07
2023-07-07 10:26:22,009 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 10100, best=0.93, avg=0.92, std=0.00, steps=8.275e+07
2023-07-07 10:26:29,637 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 10200, best=0.93, avg=0.92, std=0.00, steps=8.357e+07
2023-07-07 10:26:37,272 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 10300, best=0.93, avg=0.92, std=0.00, steps=8.439e+07
2023-07-07 10:26:44,920 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 10400, best=0.93, avg=0.92, std=0.00, steps=8.520e+07
2023-07-07 10:26:52,579 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 10500, best=0.93, avg=0.92, std=0.00, steps=8.602e+07
2023-07-07 10:27:00,244 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 10600, best=0.93, avg=0.93, std=0.00, steps=8.684e+07
2023-07-07 10:27:07,889 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 10700, best=0.93, avg=0.92, std=0.00, steps=8.766e+07
2023-07-07 10:27:15,526 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 10800, best=0.93, avg=0.93, std=0.00, steps=8.848e+07
2023-07-07 10:27:23,140 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 10900, best=0.93, avg=0.93, std=0.00, steps=8.930e+07
2023-07-07 10:27:30,784 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 11000, best=0.93, avg=0.93, std=0.00, steps=9.012e+07
2023-07-07 10:27:38,421 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 11100, best=0.93, avg=0.93, std=0.00, steps=9.094e+07
2023-07-07 10:27:46,081 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 11200, best=0.93, avg=0.93, std=0.00, steps=9.176e+07
2023-07-07 10:27:53,714 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 11300, best=0.93, avg=0.93, std=0.00, steps=9.258e+07
2023-07-07 10:28:01,352 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 11400, best=0.93, avg=0.93, std=0.00, steps=9.340e+07
2023-07-07 10:28:09,016 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 11500, best=0.93, avg=0.93, std=0.00, steps=9.422e+07
2023-07-07 10:28:16,651 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 11600, best=0.93, avg=0.93, std=0.00, steps=9.504e+07
2023-07-07 10:28:24,286 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 11700, best=0.94, avg=0.93, std=0.00, steps=9.585e+07
2023-07-07 10:28:31,922 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 11800, best=0.94, avg=0.93, std=0.00, steps=9.667e+07
2023-07-07 10:28:39,553 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 11900, best=0.94, avg=0.93, std=0.00, steps=9.749e+07
2023-07-07 10:28:47,117 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 0, 1, [Train]: 11999, best=0.93, avg=0.93, std=0.00, steps=9.830e+07
2023-07-07 10:28:47,118 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 10:28:47,142 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 10:28:47,178 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 10:28:58,506 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 100, best=0.51, avg=0.50, std=0.01, steps=1.034e+06
2023-07-07 10:29:08,005 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 200, best=0.51, avg=0.50, std=0.01, steps=2.058e+06
2023-07-07 10:29:17,524 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 300, best=0.52, avg=0.50, std=0.01, steps=3.082e+06
2023-07-07 10:29:27,040 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 400, best=0.51, avg=0.50, std=0.01, steps=4.106e+06
2023-07-07 10:29:36,547 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 500, best=0.51, avg=0.50, std=0.01, steps=5.130e+06
2023-07-07 10:29:46,075 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 600, best=0.51, avg=0.50, std=0.01, steps=6.154e+06
2023-07-07 10:29:55,593 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 700, best=0.51, avg=0.50, std=0.01, steps=7.178e+06
2023-07-07 10:30:05,122 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 800, best=0.51, avg=0.50, std=0.01, steps=8.202e+06
2023-07-07 10:30:14,613 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 900, best=0.52, avg=0.50, std=0.01, steps=9.226e+06
2023-07-07 10:30:24,094 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 1000, best=0.51, avg=0.50, std=0.01, steps=1.025e+07
2023-07-07 10:30:33,615 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 1100, best=0.52, avg=0.50, std=0.01, steps=1.127e+07
2023-07-07 10:30:43,162 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 1200, best=0.52, avg=0.50, std=0.01, steps=1.230e+07
2023-07-07 10:30:52,825 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 1300, best=0.51, avg=0.50, std=0.01, steps=1.332e+07
2023-07-07 10:31:02,424 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 1400, best=0.51, avg=0.50, std=0.01, steps=1.435e+07
2023-07-07 10:31:11,921 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 1500, best=0.51, avg=0.50, std=0.01, steps=1.537e+07
2023-07-07 10:31:21,378 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 1600, best=0.51, avg=0.50, std=0.00, steps=1.639e+07
2023-07-07 10:31:30,893 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 1700, best=0.51, avg=0.50, std=0.01, steps=1.742e+07
2023-07-07 10:31:40,429 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 1800, best=0.52, avg=0.50, std=0.01, steps=1.844e+07
2023-07-07 10:31:49,941 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 1900, best=0.52, avg=0.50, std=0.01, steps=1.947e+07
2023-07-07 10:31:59,460 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 2000, best=0.51, avg=0.50, std=0.01, steps=2.049e+07
2023-07-07 10:32:08,983 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 2100, best=0.51, avg=0.50, std=0.01, steps=2.151e+07
2023-07-07 10:32:18,495 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 2200, best=0.51, avg=0.50, std=0.00, steps=2.254e+07
2023-07-07 10:32:28,004 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 2300, best=0.52, avg=0.50, std=0.01, steps=2.356e+07
2023-07-07 10:32:37,504 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 2400, best=0.52, avg=0.50, std=0.01, steps=2.459e+07
2023-07-07 10:32:47,015 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 2500, best=0.51, avg=0.50, std=0.01, steps=2.561e+07
2023-07-07 10:32:56,509 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 2600, best=0.51, avg=0.50, std=0.01, steps=2.663e+07
2023-07-07 10:33:06,067 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 2700, best=0.52, avg=0.50, std=0.01, steps=2.766e+07
2023-07-07 10:33:15,617 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 2800, best=0.52, avg=0.50, std=0.01, steps=2.868e+07
2023-07-07 10:33:25,085 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 2900, best=0.51, avg=0.50, std=0.01, steps=2.971e+07
2023-07-07 10:33:34,593 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 3000, best=0.52, avg=0.50, std=0.01, steps=3.073e+07
2023-07-07 10:33:44,113 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 3100, best=0.51, avg=0.50, std=0.01, steps=3.175e+07
2023-07-07 10:33:53,624 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 3200, best=0.52, avg=0.50, std=0.01, steps=3.278e+07
2023-07-07 10:34:03,141 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 3300, best=0.51, avg=0.50, std=0.01, steps=3.380e+07
2023-07-07 10:34:12,667 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 3400, best=0.51, avg=0.50, std=0.01, steps=3.483e+07
2023-07-07 10:34:22,168 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 3500, best=0.51, avg=0.50, std=0.01, steps=3.585e+07
2023-07-07 10:34:31,671 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 3600, best=0.52, avg=0.50, std=0.01, steps=3.687e+07
2023-07-07 10:34:41,191 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 3700, best=0.51, avg=0.50, std=0.01, steps=3.790e+07
2023-07-07 10:34:50,691 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 3800, best=0.51, avg=0.50, std=0.01, steps=3.892e+07
2023-07-07 10:35:00,186 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 3900, best=0.51, avg=0.50, std=0.01, steps=3.995e+07
2023-07-07 10:35:09,697 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 4000, best=0.52, avg=0.50, std=0.01, steps=4.097e+07
2023-07-07 10:35:19,204 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 4100, best=0.51, avg=0.50, std=0.01, steps=4.199e+07
2023-07-07 10:35:28,711 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 4200, best=0.51, avg=0.50, std=0.00, steps=4.302e+07
2023-07-07 10:35:38,209 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 4300, best=0.52, avg=0.50, std=0.01, steps=4.404e+07
2023-07-07 10:35:47,688 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 4400, best=0.52, avg=0.50, std=0.01, steps=4.507e+07
2023-07-07 10:35:57,179 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 4500, best=0.52, avg=0.50, std=0.01, steps=4.609e+07
2023-07-07 10:36:06,707 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 4600, best=0.51, avg=0.50, std=0.01, steps=4.711e+07
2023-07-07 10:36:16,203 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 4700, best=0.51, avg=0.50, std=0.01, steps=4.814e+07
2023-07-07 10:36:25,702 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 4800, best=0.52, avg=0.50, std=0.01, steps=4.916e+07
2023-07-07 10:36:35,235 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 4900, best=0.52, avg=0.50, std=0.01, steps=5.019e+07
2023-07-07 10:36:44,753 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 5000, best=0.51, avg=0.50, std=0.01, steps=5.121e+07
2023-07-07 10:36:54,235 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 5100, best=0.52, avg=0.50, std=0.01, steps=5.223e+07
2023-07-07 10:37:03,722 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 5200, best=0.51, avg=0.50, std=0.01, steps=5.326e+07
2023-07-07 10:37:13,221 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 5300, best=0.51, avg=0.50, std=0.01, steps=5.428e+07
2023-07-07 10:37:22,708 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 5400, best=0.51, avg=0.50, std=0.01, steps=5.531e+07
2023-07-07 10:37:32,194 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 5500, best=0.51, avg=0.50, std=0.01, steps=5.633e+07
2023-07-07 10:37:41,696 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 5600, best=0.52, avg=0.50, std=0.01, steps=5.735e+07
2023-07-07 10:37:51,212 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 5700, best=0.51, avg=0.50, std=0.01, steps=5.838e+07
2023-07-07 10:38:00,723 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 5800, best=0.51, avg=0.50, std=0.01, steps=5.940e+07
2023-07-07 10:38:10,235 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 5900, best=0.51, avg=0.50, std=0.01, steps=6.043e+07
2023-07-07 10:38:19,770 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 6000, best=0.51, avg=0.50, std=0.01, steps=6.145e+07
2023-07-07 10:38:29,308 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 6100, best=0.52, avg=0.50, std=0.01, steps=6.247e+07
2023-07-07 10:38:38,835 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 6200, best=0.51, avg=0.50, std=0.01, steps=6.350e+07
2023-07-07 10:38:48,345 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 6300, best=0.51, avg=0.50, std=0.01, steps=6.452e+07
2023-07-07 10:38:57,836 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 6400, best=0.51, avg=0.50, std=0.00, steps=6.555e+07
2023-07-07 10:39:07,325 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 6500, best=0.51, avg=0.50, std=0.01, steps=6.657e+07
2023-07-07 10:39:16,785 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 6600, best=0.51, avg=0.50, std=0.01, steps=6.759e+07
2023-07-07 10:39:26,241 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 6700, best=0.52, avg=0.50, std=0.01, steps=6.862e+07
2023-07-07 10:39:35,738 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 6800, best=0.51, avg=0.50, std=0.01, steps=6.964e+07
2023-07-07 10:39:45,245 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 6900, best=0.51, avg=0.50, std=0.01, steps=7.067e+07
2023-07-07 10:39:54,743 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 7000, best=0.51, avg=0.50, std=0.01, steps=7.169e+07
2023-07-07 10:40:04,241 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 7100, best=0.52, avg=0.50, std=0.01, steps=7.271e+07
2023-07-07 10:40:13,731 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 7200, best=0.51, avg=0.50, std=0.01, steps=7.374e+07
2023-07-07 10:40:23,245 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 7300, best=0.51, avg=0.50, std=0.01, steps=7.476e+07
2023-07-07 10:40:32,753 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 7400, best=0.51, avg=0.50, std=0.01, steps=7.579e+07
2023-07-07 10:40:42,242 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 7500, best=0.52, avg=0.50, std=0.01, steps=7.681e+07
2023-07-07 10:40:51,735 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 7600, best=0.51, avg=0.50, std=0.01, steps=7.783e+07
2023-07-07 10:41:01,228 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 7700, best=0.52, avg=0.50, std=0.01, steps=7.886e+07
2023-07-07 10:41:10,741 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 7800, best=0.51, avg=0.50, std=0.01, steps=7.988e+07
2023-07-07 10:41:20,243 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 7900, best=0.51, avg=0.50, std=0.01, steps=8.091e+07
2023-07-07 10:41:29,745 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 8000, best=0.52, avg=0.50, std=0.01, steps=8.193e+07
2023-07-07 10:41:39,292 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 8100, best=0.52, avg=0.50, std=0.01, steps=8.295e+07
2023-07-07 10:41:48,815 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 8200, best=0.51, avg=0.50, std=0.01, steps=8.398e+07
2023-07-07 10:41:58,264 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 8300, best=0.51, avg=0.50, std=0.01, steps=8.500e+07
2023-07-07 10:42:07,715 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 8400, best=0.52, avg=0.50, std=0.01, steps=8.603e+07
2023-07-07 10:42:17,202 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 8500, best=0.51, avg=0.50, std=0.01, steps=8.705e+07
2023-07-07 10:42:26,698 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 8600, best=0.51, avg=0.50, std=0.01, steps=8.807e+07
2023-07-07 10:42:36,206 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 8700, best=0.51, avg=0.50, std=0.01, steps=8.910e+07
2023-07-07 10:42:45,705 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 8800, best=0.51, avg=0.50, std=0.01, steps=9.012e+07
2023-07-07 10:42:55,203 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 8900, best=0.51, avg=0.50, std=0.01, steps=9.115e+07
2023-07-07 10:43:04,698 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 9000, best=0.52, avg=0.50, std=0.01, steps=9.217e+07
2023-07-07 10:43:14,244 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 9100, best=0.52, avg=0.50, std=0.01, steps=9.319e+07
2023-07-07 10:43:23,773 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 9200, best=0.51, avg=0.50, std=0.01, steps=9.422e+07
2023-07-07 10:43:33,322 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 9300, best=0.51, avg=0.50, std=0.01, steps=9.524e+07
2023-07-07 10:43:42,926 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 9400, best=0.51, avg=0.50, std=0.01, steps=9.627e+07
2023-07-07 10:43:52,419 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 9500, best=0.52, avg=0.50, std=0.01, steps=9.729e+07
2023-07-07 10:44:01,877 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 9600, best=0.51, avg=0.50, std=0.00, steps=9.831e+07
2023-07-07 10:44:11,356 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 9700, best=0.51, avg=0.50, std=0.01, steps=9.934e+07
2023-07-07 10:44:20,888 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 9800, best=0.51, avg=0.50, std=0.01, steps=1.004e+08
2023-07-07 10:44:30,412 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 9900, best=0.66, avg=0.65, std=0.00, steps=1.014e+08
2023-07-07 10:44:39,933 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 10000, best=0.68, avg=0.68, std=0.00, steps=1.024e+08
2023-07-07 10:44:49,439 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 10100, best=0.70, avg=0.69, std=0.00, steps=1.034e+08
2023-07-07 10:44:58,931 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 10200, best=0.71, avg=0.70, std=0.00, steps=1.045e+08
2023-07-07 10:45:08,422 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 10300, best=0.72, avg=0.70, std=0.00, steps=1.055e+08
2023-07-07 10:45:17,909 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 10400, best=0.72, avg=0.71, std=0.00, steps=1.065e+08
2023-07-07 10:45:27,415 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 10500, best=0.73, avg=0.72, std=0.00, steps=1.075e+08
2023-07-07 10:45:36,928 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 10600, best=0.73, avg=0.72, std=0.00, steps=1.086e+08
2023-07-07 10:45:46,432 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 10700, best=0.74, avg=0.73, std=0.00, steps=1.096e+08
2023-07-07 10:45:55,903 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 10800, best=0.75, avg=0.73, std=0.00, steps=1.106e+08
2023-07-07 10:46:05,376 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 10900, best=0.75, avg=0.74, std=0.00, steps=1.116e+08
2023-07-07 10:46:14,855 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 11000, best=0.75, avg=0.74, std=0.00, steps=1.127e+08
2023-07-07 10:46:24,333 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 11100, best=0.76, avg=0.75, std=0.00, steps=1.137e+08
2023-07-07 10:46:33,862 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 11200, best=0.76, avg=0.75, std=0.00, steps=1.147e+08
2023-07-07 10:46:43,347 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 11300, best=0.77, avg=0.75, std=0.00, steps=1.157e+08
2023-07-07 10:46:52,846 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 11400, best=0.77, avg=0.76, std=0.00, steps=1.167e+08
2023-07-07 10:47:02,357 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 11500, best=0.77, avg=0.76, std=0.00, steps=1.178e+08
2023-07-07 10:47:11,861 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 11600, best=0.77, avg=0.76, std=0.00, steps=1.188e+08
2023-07-07 10:47:21,341 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 11700, best=0.78, avg=0.77, std=0.00, steps=1.198e+08
2023-07-07 10:47:30,845 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 11800, best=0.78, avg=0.77, std=0.00, steps=1.208e+08
2023-07-07 10:47:40,354 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 11900, best=0.79, avg=0.77, std=0.00, steps=1.219e+08
2023-07-07 10:47:49,729 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 8, 1, [Train]: 11999, best=0.79, avg=0.78, std=0.00, steps=1.229e+08
2023-07-07 10:47:49,730 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 10:47:49,752 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 10:47:49,784 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 10:48:03,065 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 100, best=0.51, avg=0.50, std=0.01, steps=1.241e+06
2023-07-07 10:48:14,419 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 200, best=0.51, avg=0.50, std=0.01, steps=2.470e+06
2023-07-07 10:48:25,761 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 300, best=0.52, avg=0.50, std=0.01, steps=3.699e+06
2023-07-07 10:48:37,116 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 400, best=0.51, avg=0.50, std=0.01, steps=4.927e+06
2023-07-07 10:48:48,456 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 500, best=0.51, avg=0.50, std=0.01, steps=6.156e+06
2023-07-07 10:48:59,784 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 600, best=0.51, avg=0.50, std=0.01, steps=7.385e+06
2023-07-07 10:49:11,106 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 700, best=0.51, avg=0.50, std=0.01, steps=8.614e+06
2023-07-07 10:49:22,453 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 800, best=0.51, avg=0.50, std=0.01, steps=9.843e+06
2023-07-07 10:49:33,799 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 900, best=0.52, avg=0.50, std=0.01, steps=1.107e+07
2023-07-07 10:49:45,150 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 1000, best=0.51, avg=0.50, std=0.01, steps=1.230e+07
2023-07-07 10:49:56,631 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 1100, best=0.52, avg=0.50, std=0.01, steps=1.353e+07
2023-07-07 10:50:08,075 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 1200, best=0.52, avg=0.50, std=0.01, steps=1.476e+07
2023-07-07 10:50:19,410 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 1300, best=0.51, avg=0.50, std=0.01, steps=1.599e+07
2023-07-07 10:50:30,785 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 1400, best=0.51, avg=0.50, std=0.01, steps=1.722e+07
2023-07-07 10:50:42,149 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 1500, best=0.51, avg=0.50, std=0.01, steps=1.844e+07
2023-07-07 10:50:53,497 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 1600, best=0.51, avg=0.50, std=0.00, steps=1.967e+07
2023-07-07 10:51:04,849 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 1700, best=0.51, avg=0.50, std=0.01, steps=2.090e+07
2023-07-07 10:51:16,218 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 1800, best=0.52, avg=0.50, std=0.01, steps=2.213e+07
2023-07-07 10:51:27,603 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 1900, best=0.52, avg=0.50, std=0.01, steps=2.336e+07
2023-07-07 10:51:38,960 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 2000, best=0.51, avg=0.50, std=0.01, steps=2.459e+07
2023-07-07 10:51:50,336 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 2100, best=0.51, avg=0.50, std=0.01, steps=2.582e+07
2023-07-07 10:52:01,791 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 2200, best=0.51, avg=0.50, std=0.00, steps=2.705e+07
2023-07-07 10:52:13,118 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 2300, best=0.52, avg=0.50, std=0.01, steps=2.827e+07
2023-07-07 10:52:24,437 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 2400, best=0.52, avg=0.50, std=0.01, steps=2.950e+07
2023-07-07 10:52:35,788 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 2500, best=0.51, avg=0.50, std=0.01, steps=3.073e+07
2023-07-07 10:52:47,134 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 2600, best=0.60, avg=0.59, std=0.00, steps=3.196e+07
2023-07-07 10:52:58,472 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 2700, best=0.62, avg=0.62, std=0.00, steps=3.319e+07
2023-07-07 10:53:09,782 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 2800, best=0.66, avg=0.64, std=0.00, steps=3.442e+07
2023-07-07 10:53:21,134 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 2900, best=0.66, avg=0.65, std=0.00, steps=3.565e+07
2023-07-07 10:53:32,486 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 3000, best=0.67, avg=0.66, std=0.00, steps=3.688e+07
2023-07-07 10:53:43,847 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 3100, best=0.68, avg=0.67, std=0.00, steps=3.811e+07
2023-07-07 10:53:55,198 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 3200, best=0.69, avg=0.68, std=0.00, steps=3.933e+07
2023-07-07 10:54:06,542 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 3300, best=0.70, avg=0.69, std=0.00, steps=4.056e+07
2023-07-07 10:54:17,978 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 3400, best=0.70, avg=0.69, std=0.00, steps=4.179e+07
2023-07-07 10:54:29,346 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 3500, best=0.71, avg=0.70, std=0.00, steps=4.302e+07
2023-07-07 10:54:40,692 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 3600, best=0.71, avg=0.70, std=0.00, steps=4.425e+07
2023-07-07 10:54:52,076 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 3700, best=0.71, avg=0.70, std=0.00, steps=4.548e+07
2023-07-07 10:55:03,432 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 3800, best=0.72, avg=0.71, std=0.00, steps=4.671e+07
2023-07-07 10:55:14,783 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 3900, best=0.72, avg=0.71, std=0.00, steps=4.794e+07
2023-07-07 10:55:26,068 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 4000, best=0.72, avg=0.71, std=0.00, steps=4.916e+07
2023-07-07 10:55:37,379 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 4100, best=0.73, avg=0.72, std=0.00, steps=5.039e+07
2023-07-07 10:55:48,710 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 4200, best=0.73, avg=0.72, std=0.00, steps=5.162e+07
2023-07-07 10:56:00,053 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 4300, best=0.74, avg=0.72, std=0.00, steps=5.285e+07
2023-07-07 10:56:11,556 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 4400, best=0.74, avg=0.73, std=0.00, steps=5.408e+07
2023-07-07 10:56:22,993 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 4500, best=0.74, avg=0.73, std=0.00, steps=5.531e+07
2023-07-07 10:56:34,348 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 4600, best=0.74, avg=0.73, std=0.00, steps=5.654e+07
2023-07-07 10:56:45,668 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 4700, best=0.74, avg=0.73, std=0.00, steps=5.777e+07
2023-07-07 10:56:56,998 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 4800, best=0.75, avg=0.74, std=0.00, steps=5.899e+07
2023-07-07 10:57:08,353 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 4900, best=0.75, avg=0.74, std=0.00, steps=6.022e+07
2023-07-07 10:57:19,629 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 5000, best=0.75, avg=0.74, std=0.00, steps=6.145e+07
2023-07-07 10:57:30,973 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 5100, best=0.75, avg=0.74, std=0.00, steps=6.268e+07
2023-07-07 10:57:42,299 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 5200, best=0.75, avg=0.74, std=0.00, steps=6.391e+07
2023-07-07 10:57:53,637 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 5300, best=0.76, avg=0.74, std=0.00, steps=6.514e+07
2023-07-07 10:58:04,966 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 5400, best=0.76, avg=0.74, std=0.00, steps=6.637e+07
2023-07-07 10:58:16,391 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 5500, best=0.76, avg=0.74, std=0.00, steps=6.760e+07
2023-07-07 10:58:27,745 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 5600, best=0.75, avg=0.75, std=0.00, steps=6.883e+07
2023-07-07 10:58:39,131 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 5700, best=0.76, avg=0.75, std=0.00, steps=7.005e+07
2023-07-07 10:58:50,471 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 5800, best=0.76, avg=0.75, std=0.00, steps=7.128e+07
2023-07-07 10:59:01,815 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 5900, best=0.76, avg=0.75, std=0.00, steps=7.251e+07
2023-07-07 10:59:13,154 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 6000, best=0.76, avg=0.75, std=0.00, steps=7.374e+07
2023-07-07 10:59:24,475 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 6100, best=0.76, avg=0.75, std=0.00, steps=7.497e+07
2023-07-07 10:59:35,844 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 6200, best=0.76, avg=0.75, std=0.00, steps=7.620e+07
2023-07-07 10:59:47,203 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 6300, best=0.76, avg=0.75, std=0.00, steps=7.743e+07
2023-07-07 10:59:58,535 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 6400, best=0.77, avg=0.75, std=0.00, steps=7.866e+07
2023-07-07 11:00:09,832 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 6500, best=0.76, avg=0.75, std=0.00, steps=7.988e+07
2023-07-07 11:00:21,127 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 6600, best=0.76, avg=0.76, std=0.00, steps=8.111e+07
2023-07-07 11:00:32,423 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 6700, best=0.77, avg=0.76, std=0.00, steps=8.234e+07
2023-07-07 11:00:43,741 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 6800, best=0.77, avg=0.76, std=0.00, steps=8.357e+07
2023-07-07 11:00:55,062 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 6900, best=0.77, avg=0.76, std=0.00, steps=8.480e+07
2023-07-07 11:01:06,410 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 7000, best=0.77, avg=0.76, std=0.00, steps=8.603e+07
2023-07-07 11:01:17,717 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 7100, best=0.77, avg=0.76, std=0.00, steps=8.726e+07
2023-07-07 11:01:29,066 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 7200, best=0.77, avg=0.76, std=0.00, steps=8.849e+07
2023-07-07 11:01:40,446 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 7300, best=0.77, avg=0.76, std=0.00, steps=8.971e+07
2023-07-07 11:01:51,827 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 7400, best=0.77, avg=0.76, std=0.00, steps=9.094e+07
2023-07-07 11:02:03,163 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 7500, best=0.77, avg=0.76, std=0.00, steps=9.217e+07
2023-07-07 11:02:14,509 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 7600, best=0.78, avg=0.77, std=0.00, steps=9.340e+07
2023-07-07 11:02:25,871 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 7700, best=0.78, avg=0.77, std=0.00, steps=9.463e+07
2023-07-07 11:02:37,342 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 7800, best=0.78, avg=0.77, std=0.00, steps=9.586e+07
2023-07-07 11:02:48,761 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 7900, best=0.78, avg=0.77, std=0.00, steps=9.709e+07
2023-07-07 11:03:00,115 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 8000, best=0.78, avg=0.77, std=0.00, steps=9.832e+07
2023-07-07 11:03:11,478 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 8100, best=0.78, avg=0.77, std=0.00, steps=9.955e+07
2023-07-07 11:03:22,821 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 8200, best=0.78, avg=0.77, std=0.00, steps=1.008e+08
2023-07-07 11:03:34,172 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 8300, best=0.78, avg=0.77, std=0.00, steps=1.020e+08
2023-07-07 11:03:45,492 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 8400, best=0.78, avg=0.77, std=0.00, steps=1.032e+08
2023-07-07 11:03:56,831 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 8500, best=0.78, avg=0.77, std=0.00, steps=1.045e+08
2023-07-07 11:04:08,182 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 8600, best=0.78, avg=0.77, std=0.00, steps=1.057e+08
2023-07-07 11:04:19,531 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 8700, best=0.78, avg=0.77, std=0.00, steps=1.069e+08
2023-07-07 11:04:30,872 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 8800, best=0.79, avg=0.78, std=0.00, steps=1.081e+08
2023-07-07 11:04:42,245 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 8900, best=0.79, avg=0.78, std=0.00, steps=1.094e+08
2023-07-07 11:04:53,556 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 9000, best=0.79, avg=0.78, std=0.00, steps=1.106e+08
2023-07-07 11:05:04,845 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 9100, best=0.79, avg=0.78, std=0.00, steps=1.118e+08
2023-07-07 11:05:16,195 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 9200, best=0.78, avg=0.78, std=0.00, steps=1.131e+08
2023-07-07 11:05:27,560 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 9300, best=0.79, avg=0.78, std=0.00, steps=1.143e+08
2023-07-07 11:05:38,916 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 9400, best=0.79, avg=0.78, std=0.00, steps=1.155e+08
2023-07-07 11:05:50,234 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 9500, best=0.79, avg=0.78, std=0.00, steps=1.167e+08
2023-07-07 11:06:01,555 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 9600, best=0.79, avg=0.78, std=0.00, steps=1.180e+08
2023-07-07 11:06:12,866 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 9700, best=0.79, avg=0.78, std=0.00, steps=1.192e+08
2023-07-07 11:06:24,217 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 9800, best=0.79, avg=0.78, std=0.00, steps=1.204e+08
2023-07-07 11:06:35,558 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 9900, best=0.79, avg=0.78, std=0.00, steps=1.217e+08
2023-07-07 11:06:46,930 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 10000, best=0.79, avg=0.78, std=0.00, steps=1.229e+08
2023-07-07 11:06:58,273 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 10100, best=0.79, avg=0.78, std=0.00, steps=1.241e+08
2023-07-07 11:07:09,602 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 10200, best=0.79, avg=0.78, std=0.00, steps=1.253e+08
2023-07-07 11:07:20,975 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 10300, best=0.80, avg=0.78, std=0.00, steps=1.266e+08
2023-07-07 11:07:32,333 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 10400, best=0.79, avg=0.78, std=0.00, steps=1.278e+08
2023-07-07 11:07:43,706 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 10500, best=0.79, avg=0.79, std=0.00, steps=1.290e+08
2023-07-07 11:07:55,058 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 10600, best=0.79, avg=0.78, std=0.00, steps=1.303e+08
2023-07-07 11:08:06,389 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 10700, best=0.79, avg=0.78, std=0.00, steps=1.315e+08
2023-07-07 11:08:17,707 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 10800, best=0.79, avg=0.79, std=0.00, steps=1.327e+08
2023-07-07 11:08:29,070 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 10900, best=0.79, avg=0.79, std=0.00, steps=1.340e+08
2023-07-07 11:08:40,423 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 11000, best=0.80, avg=0.79, std=0.00, steps=1.352e+08
2023-07-07 11:08:51,765 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 11100, best=0.79, avg=0.79, std=0.00, steps=1.364e+08
2023-07-07 11:09:03,105 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 11200, best=0.80, avg=0.79, std=0.00, steps=1.376e+08
2023-07-07 11:09:14,416 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 11300, best=0.80, avg=0.79, std=0.00, steps=1.389e+08
2023-07-07 11:09:25,744 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 11400, best=0.80, avg=0.79, std=0.00, steps=1.401e+08
2023-07-07 11:09:37,116 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 11500, best=0.80, avg=0.79, std=0.00, steps=1.413e+08
2023-07-07 11:09:48,463 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 11600, best=0.80, avg=0.79, std=0.00, steps=1.426e+08
2023-07-07 11:09:59,765 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 11700, best=0.80, avg=0.79, std=0.00, steps=1.438e+08
2023-07-07 11:10:11,007 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 11800, best=0.80, avg=0.79, std=0.00, steps=1.450e+08
2023-07-07 11:10:22,342 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 11900, best=0.80, avg=0.79, std=0.00, steps=1.462e+08
2023-07-07 11:10:33,595 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 16, 1, [Train]: 11999, best=0.80, avg=0.79, std=0.00, steps=1.475e+08
2023-07-07 11:10:33,596 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 11:10:33,621 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 11:10:33,656 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 11:10:50,632 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 100, best=0.51, avg=0.50, std=0.01, steps=1.655e+06
2023-07-07 11:11:05,693 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 200, best=0.51, avg=0.50, std=0.01, steps=3.293e+06
2023-07-07 11:11:20,717 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 300, best=0.52, avg=0.50, std=0.01, steps=4.932e+06
2023-07-07 11:11:35,839 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 400, best=0.51, avg=0.50, std=0.01, steps=6.570e+06
2023-07-07 11:11:50,905 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 500, best=0.51, avg=0.50, std=0.01, steps=8.208e+06
2023-07-07 11:12:05,941 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 600, best=0.51, avg=0.50, std=0.01, steps=9.847e+06
2023-07-07 11:12:20,959 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 700, best=0.51, avg=0.50, std=0.01, steps=1.149e+07
2023-07-07 11:12:35,997 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 800, best=0.51, avg=0.50, std=0.01, steps=1.312e+07
2023-07-07 11:12:51,036 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 900, best=0.52, avg=0.50, std=0.01, steps=1.476e+07
2023-07-07 11:13:06,030 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 1000, best=0.51, avg=0.50, std=0.01, steps=1.640e+07
2023-07-07 11:13:21,132 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 1100, best=0.52, avg=0.50, std=0.01, steps=1.804e+07
2023-07-07 11:13:36,180 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 1200, best=0.52, avg=0.50, std=0.01, steps=1.968e+07
2023-07-07 11:13:51,222 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 1300, best=0.51, avg=0.50, std=0.01, steps=2.132e+07
2023-07-07 11:14:06,233 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 1400, best=0.51, avg=0.50, std=0.01, steps=2.295e+07
2023-07-07 11:14:21,258 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 1500, best=0.52, avg=0.50, std=0.01, steps=2.459e+07
2023-07-07 11:14:36,310 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 1600, best=0.51, avg=0.50, std=0.00, steps=2.623e+07
2023-07-07 11:14:51,344 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 1700, best=0.51, avg=0.50, std=0.01, steps=2.787e+07
2023-07-07 11:15:06,364 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 1800, best=0.51, avg=0.50, std=0.01, steps=2.951e+07
2023-07-07 11:15:21,386 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 1900, best=0.51, avg=0.50, std=0.01, steps=3.115e+07
2023-07-07 11:15:36,570 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 2000, best=0.51, avg=0.50, std=0.01, steps=3.278e+07
2023-07-07 11:15:51,598 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 2100, best=0.52, avg=0.50, std=0.01, steps=3.442e+07
2023-07-07 11:16:06,592 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 2200, best=0.51, avg=0.50, std=0.00, steps=3.606e+07
2023-07-07 11:16:21,593 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 2300, best=0.52, avg=0.50, std=0.01, steps=3.770e+07
2023-07-07 11:16:36,573 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 2400, best=0.51, avg=0.50, std=0.01, steps=3.934e+07
2023-07-07 11:16:51,622 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 2500, best=0.51, avg=0.50, std=0.01, steps=4.098e+07
2023-07-07 11:17:06,671 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 2600, best=0.51, avg=0.50, std=0.01, steps=4.261e+07
2023-07-07 11:17:21,683 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 2700, best=0.51, avg=0.50, std=0.01, steps=4.425e+07
2023-07-07 11:17:36,779 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 2800, best=0.52, avg=0.50, std=0.01, steps=4.589e+07
2023-07-07 11:17:51,775 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 2900, best=0.52, avg=0.50, std=0.01, steps=4.753e+07
2023-07-07 11:18:06,838 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 3000, best=0.51, avg=0.50, std=0.01, steps=4.917e+07
2023-07-07 11:18:21,872 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 3100, best=0.51, avg=0.50, std=0.01, steps=5.081e+07
2023-07-07 11:18:36,864 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 3200, best=0.51, avg=0.50, std=0.01, steps=5.245e+07
2023-07-07 11:18:51,798 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 3300, best=0.51, avg=0.50, std=0.01, steps=5.408e+07
2023-07-07 11:19:06,792 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 3400, best=0.51, avg=0.50, std=0.01, steps=5.572e+07
2023-07-07 11:19:21,767 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 3500, best=0.51, avg=0.50, std=0.01, steps=5.736e+07
2023-07-07 11:19:36,762 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 3600, best=0.52, avg=0.50, std=0.01, steps=5.900e+07
2023-07-07 11:19:51,858 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 3700, best=0.51, avg=0.50, std=0.01, steps=6.064e+07
2023-07-07 11:20:06,873 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 3800, best=0.51, avg=0.50, std=0.01, steps=6.228e+07
2023-07-07 11:20:21,870 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 3900, best=0.51, avg=0.50, std=0.01, steps=6.391e+07
2023-07-07 11:20:36,836 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 4000, best=0.52, avg=0.50, std=0.01, steps=6.555e+07
2023-07-07 11:20:51,807 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 4100, best=0.52, avg=0.50, std=0.01, steps=6.719e+07
2023-07-07 11:21:06,798 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 4200, best=0.51, avg=0.50, std=0.00, steps=6.883e+07
2023-07-07 11:21:21,799 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 4300, best=0.51, avg=0.50, std=0.01, steps=7.047e+07
2023-07-07 11:21:36,765 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 4400, best=0.52, avg=0.50, std=0.01, steps=7.211e+07
2023-07-07 11:21:51,788 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 4500, best=0.51, avg=0.50, std=0.01, steps=7.374e+07
2023-07-07 11:22:06,804 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 4600, best=0.52, avg=0.50, std=0.01, steps=7.538e+07
2023-07-07 11:22:21,802 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 4700, best=0.52, avg=0.50, std=0.01, steps=7.702e+07
2023-07-07 11:22:36,828 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 4800, best=0.51, avg=0.50, std=0.01, steps=7.866e+07
2023-07-07 11:22:51,811 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 4900, best=0.51, avg=0.50, std=0.01, steps=8.030e+07
2023-07-07 11:23:06,784 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 5000, best=0.51, avg=0.50, std=0.01, steps=8.194e+07
2023-07-07 11:23:21,761 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 5100, best=0.51, avg=0.50, std=0.01, steps=8.357e+07
2023-07-07 11:23:36,773 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 5200, best=0.52, avg=0.50, std=0.01, steps=8.521e+07
2023-07-07 11:23:51,829 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 5300, best=0.52, avg=0.50, std=0.01, steps=8.685e+07
2023-07-07 11:24:06,821 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 5400, best=0.51, avg=0.50, std=0.01, steps=8.849e+07
2023-07-07 11:24:21,826 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 5500, best=0.52, avg=0.50, std=0.01, steps=9.013e+07
2023-07-07 11:24:36,817 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 5600, best=0.51, avg=0.50, std=0.01, steps=9.177e+07
2023-07-07 11:24:51,815 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 5700, best=0.51, avg=0.50, std=0.01, steps=9.341e+07
2023-07-07 11:25:06,826 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 5800, best=0.51, avg=0.50, std=0.01, steps=9.504e+07
2023-07-07 11:25:21,859 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 5900, best=0.51, avg=0.50, std=0.01, steps=9.668e+07
2023-07-07 11:25:36,917 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 6000, best=0.51, avg=0.50, std=0.01, steps=9.832e+07
2023-07-07 11:25:51,904 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 6100, best=0.51, avg=0.50, std=0.01, steps=9.996e+07
2023-07-07 11:26:06,948 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 6200, best=0.52, avg=0.50, std=0.01, steps=1.016e+08
2023-07-07 11:26:22,003 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 6300, best=0.52, avg=0.50, std=0.01, steps=1.032e+08
2023-07-07 11:26:37,070 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 6400, best=0.51, avg=0.50, std=0.00, steps=1.049e+08
2023-07-07 11:26:52,086 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 6500, best=0.51, avg=0.50, std=0.01, steps=1.065e+08
2023-07-07 11:27:07,117 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 6600, best=0.51, avg=0.50, std=0.01, steps=1.082e+08
2023-07-07 11:27:22,130 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 6700, best=0.52, avg=0.50, std=0.01, steps=1.098e+08
2023-07-07 11:27:37,113 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 6800, best=0.51, avg=0.50, std=0.01, steps=1.114e+08
2023-07-07 11:27:52,105 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 6900, best=0.51, avg=0.50, std=0.01, steps=1.131e+08
2023-07-07 11:28:07,136 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 7000, best=0.51, avg=0.50, std=0.01, steps=1.147e+08
2023-07-07 11:28:22,190 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 7100, best=0.52, avg=0.50, std=0.01, steps=1.163e+08
2023-07-07 11:28:37,227 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 7200, best=0.52, avg=0.50, std=0.01, steps=1.180e+08
2023-07-07 11:28:52,213 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 7300, best=0.52, avg=0.50, std=0.01, steps=1.196e+08
2023-07-07 11:29:07,185 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 7400, best=0.51, avg=0.50, std=0.01, steps=1.213e+08
2023-07-07 11:29:22,144 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 7500, best=0.51, avg=0.50, std=0.01, steps=1.229e+08
2023-07-07 11:29:37,141 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 7600, best=0.52, avg=0.50, std=0.01, steps=1.245e+08
2023-07-07 11:29:52,121 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 7700, best=0.51, avg=0.50, std=0.01, steps=1.262e+08
2023-07-07 11:30:07,099 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 7800, best=0.51, avg=0.50, std=0.01, steps=1.278e+08
2023-07-07 11:30:22,166 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 7900, best=0.52, avg=0.50, std=0.01, steps=1.294e+08
2023-07-07 11:30:37,162 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 8000, best=0.51, avg=0.50, std=0.01, steps=1.311e+08
2023-07-07 11:30:52,196 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 8100, best=0.52, avg=0.50, std=0.01, steps=1.327e+08
2023-07-07 11:31:07,221 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 8200, best=0.51, avg=0.50, std=0.01, steps=1.344e+08
2023-07-07 11:31:22,247 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 8300, best=0.51, avg=0.50, std=0.01, steps=1.360e+08
2023-07-07 11:31:37,225 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 8400, best=0.51, avg=0.50, std=0.01, steps=1.376e+08
2023-07-07 11:31:52,239 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 8500, best=0.51, avg=0.50, std=0.01, steps=1.393e+08
2023-07-07 11:32:07,247 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 8600, best=0.52, avg=0.50, std=0.01, steps=1.409e+08
2023-07-07 11:32:22,275 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 8700, best=0.51, avg=0.50, std=0.01, steps=1.426e+08
2023-07-07 11:32:37,331 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 8800, best=0.51, avg=0.50, std=0.01, steps=1.442e+08
2023-07-07 11:32:52,320 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 8900, best=0.52, avg=0.50, std=0.01, steps=1.458e+08
2023-07-07 11:33:07,323 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 9000, best=0.51, avg=0.50, std=0.01, steps=1.475e+08
2023-07-07 11:33:22,320 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 9100, best=0.51, avg=0.50, std=0.01, steps=1.491e+08
2023-07-07 11:33:37,371 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 9200, best=0.51, avg=0.50, std=0.01, steps=1.507e+08
2023-07-07 11:33:52,424 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 9300, best=0.52, avg=0.50, std=0.01, steps=1.524e+08
2023-07-07 11:34:07,455 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 9400, best=0.51, avg=0.50, std=0.01, steps=1.540e+08
2023-07-07 11:34:22,516 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 9500, best=0.51, avg=0.50, std=0.01, steps=1.557e+08
2023-07-07 11:34:37,530 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 9600, best=0.52, avg=0.50, std=0.00, steps=1.573e+08
2023-07-07 11:34:52,555 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 9700, best=0.51, avg=0.50, std=0.01, steps=1.589e+08
2023-07-07 11:35:07,533 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 9800, best=0.52, avg=0.50, std=0.01, steps=1.606e+08
2023-07-07 11:35:22,481 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 9900, best=0.51, avg=0.50, std=0.01, steps=1.622e+08
2023-07-07 11:35:37,373 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 10000, best=0.51, avg=0.50, std=0.01, steps=1.639e+08
2023-07-07 11:35:52,341 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 10100, best=0.51, avg=0.50, std=0.01, steps=1.655e+08
2023-07-07 11:36:07,329 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 10200, best=0.52, avg=0.50, std=0.01, steps=1.671e+08
2023-07-07 11:36:22,371 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 10300, best=0.52, avg=0.50, std=0.01, steps=1.688e+08
2023-07-07 11:36:37,391 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 10400, best=0.51, avg=0.50, std=0.01, steps=1.704e+08
2023-07-07 11:36:52,387 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 10500, best=0.52, avg=0.50, std=0.01, steps=1.720e+08
2023-07-07 11:37:07,357 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 10600, best=0.51, avg=0.50, std=0.01, steps=1.737e+08
2023-07-07 11:37:22,374 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 10700, best=0.51, avg=0.50, std=0.01, steps=1.753e+08
2023-07-07 11:37:37,412 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 10800, best=0.52, avg=0.50, std=0.01, steps=1.770e+08
2023-07-07 11:37:52,439 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 10900, best=0.52, avg=0.50, std=0.01, steps=1.786e+08
2023-07-07 11:38:07,470 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 11000, best=0.51, avg=0.50, std=0.01, steps=1.802e+08
2023-07-07 11:38:22,494 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 11100, best=0.52, avg=0.50, std=0.01, steps=1.819e+08
2023-07-07 11:38:37,585 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 11200, best=0.51, avg=0.50, std=0.01, steps=1.835e+08
2023-07-07 11:38:52,619 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 11300, best=0.51, avg=0.50, std=0.00, steps=1.852e+08
2023-07-07 11:39:07,637 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 11400, best=0.51, avg=0.50, std=0.01, steps=1.868e+08
2023-07-07 11:39:22,661 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 11500, best=0.51, avg=0.50, std=0.01, steps=1.884e+08
2023-07-07 11:39:37,684 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 11600, best=0.51, avg=0.50, std=0.01, steps=1.901e+08
2023-07-07 11:39:52,772 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 11700, best=0.51, avg=0.50, std=0.01, steps=1.917e+08
2023-07-07 11:40:07,844 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 11800, best=0.52, avg=0.50, std=0.01, steps=1.933e+08
2023-07-07 11:40:22,891 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 11900, best=0.51, avg=0.50, std=0.01, steps=1.950e+08
2023-07-07 11:40:37,766 -        meta learning: [    INFO] - [Len Lat Rep]: 16, 32, 1, [Train]: 11999, best=0.51, avg=0.50, std=0.01, steps=1.966e+08
2023-07-07 11:40:37,766 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 11:40:37,791 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 11:40:37,825 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 11:40:54,604 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 100, best=0.51, avg=0.50, std=0.00, steps=1.655e+06
2023-07-07 11:41:09,739 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 200, best=0.62, avg=0.61, std=0.00, steps=3.293e+06
2023-07-07 11:41:24,789 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 300, best=0.65, avg=0.64, std=0.00, steps=4.932e+06
2023-07-07 11:41:39,901 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 400, best=0.67, avg=0.66, std=0.00, steps=6.570e+06
2023-07-07 11:41:54,969 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 500, best=0.68, avg=0.67, std=0.00, steps=8.208e+06
2023-07-07 11:42:09,949 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 600, best=0.69, avg=0.68, std=0.00, steps=9.847e+06
2023-07-07 11:42:24,955 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 700, best=0.69, avg=0.69, std=0.00, steps=1.149e+07
2023-07-07 11:42:39,967 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 800, best=0.70, avg=0.69, std=0.00, steps=1.312e+07
2023-07-07 11:42:54,945 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 900, best=0.71, avg=0.70, std=0.00, steps=1.476e+07
2023-07-07 11:43:09,997 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 1000, best=0.71, avg=0.70, std=0.00, steps=1.640e+07
2023-07-07 11:43:25,062 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 1100, best=0.71, avg=0.71, std=0.00, steps=1.804e+07
2023-07-07 11:43:40,123 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 1200, best=0.71, avg=0.71, std=0.00, steps=1.968e+07
2023-07-07 11:43:55,143 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 1300, best=0.72, avg=0.71, std=0.00, steps=2.132e+07
2023-07-07 11:44:10,149 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 1400, best=0.72, avg=0.71, std=0.00, steps=2.295e+07
2023-07-07 11:44:25,154 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 1500, best=0.72, avg=0.72, std=0.00, steps=2.459e+07
2023-07-07 11:44:40,141 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 1600, best=0.73, avg=0.72, std=0.00, steps=2.623e+07
2023-07-07 11:44:55,121 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 1700, best=0.73, avg=0.72, std=0.00, steps=2.787e+07
2023-07-07 11:45:10,201 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 1800, best=0.73, avg=0.72, std=0.00, steps=2.951e+07
2023-07-07 11:45:25,208 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 1900, best=0.73, avg=0.72, std=0.00, steps=3.115e+07
2023-07-07 11:45:40,242 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 2000, best=0.73, avg=0.73, std=0.00, steps=3.278e+07
2023-07-07 11:45:55,281 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 2100, best=0.73, avg=0.73, std=0.00, steps=3.442e+07
2023-07-07 11:46:10,280 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 2200, best=0.73, avg=0.73, std=0.00, steps=3.606e+07
2023-07-07 11:46:25,341 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 2300, best=0.74, avg=0.73, std=0.00, steps=3.770e+07
2023-07-07 11:46:40,375 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 2400, best=0.74, avg=0.73, std=0.00, steps=3.934e+07
2023-07-07 11:46:55,410 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 2500, best=0.74, avg=0.73, std=0.00, steps=4.098e+07
2023-07-07 11:47:10,485 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 2600, best=0.74, avg=0.73, std=0.00, steps=4.261e+07
2023-07-07 11:47:25,557 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 2700, best=0.74, avg=0.74, std=0.00, steps=4.425e+07
2023-07-07 11:47:40,535 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 2800, best=0.75, avg=0.74, std=0.00, steps=4.589e+07
2023-07-07 11:47:55,541 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 2900, best=0.75, avg=0.74, std=0.00, steps=4.753e+07
2023-07-07 11:48:10,594 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 3000, best=0.75, avg=0.74, std=0.00, steps=4.917e+07
2023-07-07 11:48:25,640 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 3100, best=0.75, avg=0.74, std=0.00, steps=5.081e+07
2023-07-07 11:48:40,712 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 3200, best=0.75, avg=0.74, std=0.00, steps=5.245e+07
2023-07-07 11:48:55,770 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 3300, best=0.75, avg=0.74, std=0.00, steps=5.408e+07
2023-07-07 11:49:10,818 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 3400, best=0.75, avg=0.75, std=0.00, steps=5.572e+07
2023-07-07 11:49:25,811 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 3500, best=0.75, avg=0.75, std=0.00, steps=5.736e+07
2023-07-07 11:49:40,914 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 3600, best=0.76, avg=0.75, std=0.00, steps=5.900e+07
2023-07-07 11:49:55,900 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 3700, best=0.76, avg=0.75, std=0.00, steps=6.064e+07
2023-07-07 11:50:10,953 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 3800, best=0.76, avg=0.75, std=0.00, steps=6.228e+07
2023-07-07 11:50:25,963 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 3900, best=0.76, avg=0.75, std=0.00, steps=6.391e+07
2023-07-07 11:50:41,015 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 4000, best=0.76, avg=0.75, std=0.00, steps=6.555e+07
2023-07-07 11:50:56,040 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 4100, best=0.76, avg=0.75, std=0.00, steps=6.719e+07
2023-07-07 11:51:11,042 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 4200, best=0.76, avg=0.75, std=0.00, steps=6.883e+07
2023-07-07 11:51:26,061 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 4300, best=0.77, avg=0.75, std=0.00, steps=7.047e+07
2023-07-07 11:51:41,065 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 4400, best=0.77, avg=0.76, std=0.00, steps=7.211e+07
2023-07-07 11:51:56,241 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 4500, best=0.77, avg=0.76, std=0.00, steps=7.374e+07
2023-07-07 11:52:11,320 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 4600, best=0.77, avg=0.76, std=0.00, steps=7.538e+07
2023-07-07 11:52:26,357 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 4700, best=0.77, avg=0.76, std=0.00, steps=7.702e+07
2023-07-07 11:52:41,363 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 4800, best=0.77, avg=0.76, std=0.00, steps=7.866e+07
2023-07-07 11:52:56,372 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 4900, best=0.77, avg=0.76, std=0.00, steps=8.030e+07
2023-07-07 11:53:11,412 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 5000, best=0.77, avg=0.76, std=0.00, steps=8.194e+07
2023-07-07 11:53:26,451 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 5100, best=0.78, avg=0.77, std=0.00, steps=8.357e+07
2023-07-07 11:53:41,475 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 5200, best=0.77, avg=0.77, std=0.00, steps=8.521e+07
2023-07-07 11:53:56,472 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 5300, best=0.78, avg=0.77, std=0.00, steps=8.685e+07
2023-07-07 11:54:11,493 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 5400, best=0.78, avg=0.77, std=0.00, steps=8.849e+07
2023-07-07 11:54:26,463 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 5500, best=0.78, avg=0.77, std=0.00, steps=9.013e+07
2023-07-07 11:54:41,489 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 5600, best=0.78, avg=0.77, std=0.00, steps=9.177e+07
2023-07-07 11:54:56,474 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 5700, best=0.78, avg=0.77, std=0.00, steps=9.341e+07
2023-07-07 11:55:11,513 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 5800, best=0.78, avg=0.77, std=0.00, steps=9.504e+07
2023-07-07 11:55:26,498 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 5900, best=0.78, avg=0.77, std=0.00, steps=9.668e+07
2023-07-07 11:55:41,478 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 6000, best=0.78, avg=0.78, std=0.00, steps=9.832e+07
2023-07-07 11:55:56,466 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 6100, best=0.78, avg=0.78, std=0.00, steps=9.996e+07
2023-07-07 11:56:11,482 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 6200, best=0.79, avg=0.78, std=0.00, steps=1.016e+08
2023-07-07 11:56:26,533 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 6300, best=0.79, avg=0.78, std=0.00, steps=1.032e+08
2023-07-07 11:56:41,529 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 6400, best=0.78, avg=0.78, std=0.00, steps=1.049e+08
2023-07-07 11:56:56,516 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 6500, best=0.78, avg=0.78, std=0.00, steps=1.065e+08
2023-07-07 11:57:11,541 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 6600, best=0.79, avg=0.78, std=0.00, steps=1.082e+08
2023-07-07 11:57:26,547 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 6700, best=0.79, avg=0.78, std=0.00, steps=1.098e+08
2023-07-07 11:57:41,594 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 6800, best=0.79, avg=0.78, std=0.00, steps=1.114e+08
2023-07-07 11:57:56,646 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 6900, best=0.79, avg=0.78, std=0.00, steps=1.131e+08
2023-07-07 11:58:11,654 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 7000, best=0.79, avg=0.78, std=0.00, steps=1.147e+08
2023-07-07 11:58:26,633 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 7100, best=0.79, avg=0.78, std=0.00, steps=1.163e+08
2023-07-07 11:58:41,692 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 7200, best=0.79, avg=0.78, std=0.00, steps=1.180e+08
2023-07-07 11:58:56,706 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 7300, best=0.79, avg=0.78, std=0.00, steps=1.196e+08
2023-07-07 11:59:11,759 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 7400, best=0.79, avg=0.79, std=0.00, steps=1.213e+08
2023-07-07 11:59:26,813 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 7500, best=0.79, avg=0.79, std=0.00, steps=1.229e+08
2023-07-07 11:59:41,901 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 7600, best=0.79, avg=0.79, std=0.00, steps=1.245e+08
2023-07-07 11:59:56,967 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 7700, best=0.79, avg=0.79, std=0.00, steps=1.262e+08
2023-07-07 12:00:11,960 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 7800, best=0.80, avg=0.79, std=0.00, steps=1.278e+08
2023-07-07 12:00:27,009 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 7900, best=0.80, avg=0.79, std=0.00, steps=1.294e+08
2023-07-07 12:00:41,979 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 8000, best=0.80, avg=0.79, std=0.00, steps=1.311e+08
2023-07-07 12:00:56,976 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 8100, best=0.80, avg=0.79, std=0.00, steps=1.327e+08
2023-07-07 12:01:12,019 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 8200, best=0.80, avg=0.79, std=0.00, steps=1.344e+08
2023-07-07 12:01:27,044 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 8300, best=0.80, avg=0.79, std=0.00, steps=1.360e+08
2023-07-07 12:01:42,066 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 8400, best=0.80, avg=0.79, std=0.00, steps=1.376e+08
2023-07-07 12:01:57,046 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 8500, best=0.80, avg=0.79, std=0.00, steps=1.393e+08
2023-07-07 12:02:12,038 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 8600, best=0.80, avg=0.79, std=0.00, steps=1.409e+08
2023-07-07 12:02:27,005 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 8700, best=0.80, avg=0.79, std=0.00, steps=1.426e+08
2023-07-07 12:02:41,990 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 8800, best=0.80, avg=0.79, std=0.00, steps=1.442e+08
2023-07-07 12:02:56,999 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 8900, best=0.80, avg=0.79, std=0.00, steps=1.458e+08
2023-07-07 12:03:12,028 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 9000, best=0.80, avg=0.79, std=0.00, steps=1.475e+08
2023-07-07 12:03:27,032 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 9100, best=0.80, avg=0.79, std=0.00, steps=1.491e+08
2023-07-07 12:03:42,064 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 9200, best=0.80, avg=0.79, std=0.00, steps=1.507e+08
2023-07-07 12:03:57,122 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 9300, best=0.80, avg=0.80, std=0.00, steps=1.524e+08
2023-07-07 12:04:12,155 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 9400, best=0.80, avg=0.80, std=0.00, steps=1.540e+08
2023-07-07 12:04:27,202 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 9500, best=0.80, avg=0.80, std=0.00, steps=1.557e+08
2023-07-07 12:04:42,236 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 9600, best=0.80, avg=0.80, std=0.00, steps=1.573e+08
2023-07-07 12:04:57,305 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 9700, best=0.80, avg=0.80, std=0.00, steps=1.589e+08
2023-07-07 12:05:12,358 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 9800, best=0.80, avg=0.80, std=0.00, steps=1.606e+08
2023-07-07 12:05:27,373 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 9900, best=0.80, avg=0.80, std=0.00, steps=1.622e+08
2023-07-07 12:05:42,375 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 10000, best=0.80, avg=0.80, std=0.00, steps=1.639e+08
2023-07-07 12:05:57,423 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 10100, best=0.81, avg=0.80, std=0.00, steps=1.655e+08
2023-07-07 12:06:12,453 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 10200, best=0.81, avg=0.80, std=0.00, steps=1.671e+08
2023-07-07 12:06:27,458 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 10300, best=0.81, avg=0.80, std=0.00, steps=1.688e+08
2023-07-07 12:06:42,475 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 10400, best=0.81, avg=0.80, std=0.00, steps=1.704e+08
2023-07-07 12:06:57,481 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 10500, best=0.81, avg=0.80, std=0.00, steps=1.720e+08
2023-07-07 12:07:12,506 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 10600, best=0.81, avg=0.80, std=0.00, steps=1.737e+08
2023-07-07 12:07:27,554 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 10700, best=0.81, avg=0.80, std=0.00, steps=1.753e+08
2023-07-07 12:07:42,534 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 10800, best=0.81, avg=0.80, std=0.00, steps=1.770e+08
2023-07-07 12:07:57,548 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 10900, best=0.81, avg=0.80, std=0.00, steps=1.786e+08
2023-07-07 12:08:12,559 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 11000, best=0.81, avg=0.80, std=0.00, steps=1.802e+08
2023-07-07 12:08:27,540 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 11100, best=0.81, avg=0.80, std=0.00, steps=1.819e+08
2023-07-07 12:08:42,593 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 11200, best=0.81, avg=0.80, std=0.00, steps=1.835e+08
2023-07-07 12:08:57,586 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 11300, best=0.81, avg=0.80, std=0.00, steps=1.852e+08
2023-07-07 12:09:12,632 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 11400, best=0.81, avg=0.81, std=0.00, steps=1.868e+08
2023-07-07 12:09:27,677 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 11500, best=0.81, avg=0.80, std=0.00, steps=1.884e+08
2023-07-07 12:09:42,731 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 11600, best=0.81, avg=0.80, std=0.00, steps=1.901e+08
2023-07-07 12:09:57,789 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 11700, best=0.81, avg=0.81, std=0.00, steps=1.917e+08
2023-07-07 12:10:12,849 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 11800, best=0.81, avg=0.81, std=0.00, steps=1.933e+08
2023-07-07 12:10:27,915 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 11900, best=0.81, avg=0.81, std=0.00, steps=1.950e+08
2023-07-07 12:10:42,817 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 0, 1, [Train]: 11999, best=0.81, avg=0.81, std=0.00, steps=1.966e+08
2023-07-07 12:10:42,817 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 12:10:42,842 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 12:10:42,874 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 12:11:01,597 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 100, best=0.52, avg=0.51, std=0.00, steps=1.862e+06
2023-07-07 12:11:18,484 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 200, best=0.60, avg=0.60, std=0.00, steps=3.705e+06
2023-07-07 12:11:35,340 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 300, best=0.62, avg=0.62, std=0.00, steps=5.548e+06
2023-07-07 12:11:52,185 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 400, best=0.64, avg=0.63, std=0.00, steps=7.391e+06
2023-07-07 12:12:09,108 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 500, best=0.65, avg=0.64, std=0.00, steps=9.234e+06
2023-07-07 12:12:26,015 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 600, best=0.66, avg=0.65, std=0.00, steps=1.108e+07
2023-07-07 12:12:42,881 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 700, best=0.67, avg=0.66, std=0.00, steps=1.292e+07
2023-07-07 12:12:59,802 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 800, best=0.67, avg=0.66, std=0.00, steps=1.476e+07
2023-07-07 12:13:16,680 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 900, best=0.68, avg=0.67, std=0.00, steps=1.661e+07
2023-07-07 12:13:33,591 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 1000, best=0.68, avg=0.67, std=0.00, steps=1.845e+07
2023-07-07 12:13:50,485 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 1100, best=0.68, avg=0.68, std=0.00, steps=2.029e+07
2023-07-07 12:14:07,375 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 1200, best=0.68, avg=0.68, std=0.00, steps=2.214e+07
2023-07-07 12:14:24,270 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 1300, best=0.69, avg=0.68, std=0.00, steps=2.398e+07
2023-07-07 12:14:41,192 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 1400, best=0.69, avg=0.68, std=0.00, steps=2.582e+07
2023-07-07 12:14:58,103 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 1500, best=0.69, avg=0.68, std=0.00, steps=2.767e+07
2023-07-07 12:15:15,052 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 1600, best=0.69, avg=0.69, std=0.00, steps=2.951e+07
2023-07-07 12:15:32,011 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 1700, best=0.69, avg=0.69, std=0.00, steps=3.135e+07
2023-07-07 12:15:48,920 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 1800, best=0.70, avg=0.69, std=0.00, steps=3.320e+07
2023-07-07 12:16:05,835 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 1900, best=0.70, avg=0.69, std=0.00, steps=3.504e+07
2023-07-07 12:16:22,744 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 2000, best=0.70, avg=0.69, std=0.00, steps=3.688e+07
2023-07-07 12:16:39,646 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 2100, best=0.70, avg=0.69, std=0.00, steps=3.873e+07
2023-07-07 12:16:56,521 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 2200, best=0.70, avg=0.69, std=0.00, steps=4.057e+07
2023-07-07 12:17:13,416 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 2300, best=0.71, avg=0.70, std=0.00, steps=4.241e+07
2023-07-07 12:17:30,323 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 2400, best=0.70, avg=0.70, std=0.00, steps=4.426e+07
2023-07-07 12:17:47,191 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 2500, best=0.71, avg=0.70, std=0.00, steps=4.610e+07
2023-07-07 12:18:04,070 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 2600, best=0.71, avg=0.70, std=0.00, steps=4.794e+07
2023-07-07 12:18:20,941 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 2700, best=0.71, avg=0.70, std=0.00, steps=4.978e+07
2023-07-07 12:18:37,845 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 2800, best=0.71, avg=0.70, std=0.00, steps=5.163e+07
2023-07-07 12:18:54,749 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 2900, best=0.71, avg=0.70, std=0.00, steps=5.347e+07
2023-07-07 12:19:11,605 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 3000, best=0.71, avg=0.70, std=0.00, steps=5.531e+07
2023-07-07 12:19:28,506 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 3100, best=0.71, avg=0.71, std=0.00, steps=5.716e+07
2023-07-07 12:19:45,381 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 3200, best=0.71, avg=0.71, std=0.00, steps=5.900e+07
2023-07-07 12:20:02,210 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 3300, best=0.71, avg=0.71, std=0.00, steps=6.084e+07
2023-07-07 12:20:19,051 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 3400, best=0.72, avg=0.71, std=0.00, steps=6.269e+07
2023-07-07 12:20:35,854 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 3500, best=0.72, avg=0.71, std=0.00, steps=6.453e+07
2023-07-07 12:20:52,665 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 3600, best=0.72, avg=0.71, std=0.00, steps=6.637e+07
2023-07-07 12:21:09,486 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 3700, best=0.72, avg=0.71, std=0.00, steps=6.822e+07
2023-07-07 12:21:26,390 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 3800, best=0.72, avg=0.71, std=0.00, steps=7.006e+07
2023-07-07 12:21:43,296 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 3900, best=0.72, avg=0.71, std=0.00, steps=7.190e+07
2023-07-07 12:22:00,133 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 4000, best=0.72, avg=0.71, std=0.00, steps=7.375e+07
2023-07-07 12:22:17,066 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 4100, best=0.72, avg=0.71, std=0.00, steps=7.559e+07
2023-07-07 12:22:33,998 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 4200, best=0.72, avg=0.71, std=0.00, steps=7.743e+07
2023-07-07 12:22:50,844 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 4300, best=0.72, avg=0.72, std=0.00, steps=7.928e+07
2023-07-07 12:23:07,721 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 4400, best=0.72, avg=0.72, std=0.00, steps=8.112e+07
2023-07-07 12:23:24,605 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 4500, best=0.72, avg=0.72, std=0.00, steps=8.296e+07
2023-07-07 12:23:41,706 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 4600, best=0.72, avg=0.72, std=0.00, steps=8.481e+07
2023-07-07 12:23:59,003 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 4700, best=0.72, avg=0.72, std=0.00, steps=8.665e+07
2023-07-07 12:24:15,930 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 4800, best=0.72, avg=0.72, std=0.00, steps=8.849e+07
2023-07-07 12:24:32,760 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 4900, best=0.73, avg=0.72, std=0.00, steps=9.034e+07
2023-07-07 12:24:49,749 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 5000, best=0.73, avg=0.72, std=0.00, steps=9.218e+07
2023-07-07 12:25:06,617 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 5100, best=0.73, avg=0.72, std=0.00, steps=9.402e+07
2023-07-07 12:25:23,457 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 5200, best=0.73, avg=0.72, std=0.00, steps=9.586e+07
2023-07-07 12:25:40,266 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 5300, best=0.73, avg=0.72, std=0.00, steps=9.771e+07
2023-07-07 12:25:57,073 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 5400, best=0.73, avg=0.72, std=0.00, steps=9.955e+07
2023-07-07 12:26:13,969 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 5500, best=0.73, avg=0.72, std=0.00, steps=1.014e+08
2023-07-07 12:26:30,886 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 5600, best=0.73, avg=0.72, std=0.00, steps=1.032e+08
2023-07-07 12:26:47,774 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 5700, best=0.73, avg=0.72, std=0.00, steps=1.051e+08
2023-07-07 12:27:04,592 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 5800, best=0.73, avg=0.72, std=0.00, steps=1.069e+08
2023-07-07 12:27:21,444 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 5900, best=0.73, avg=0.72, std=0.00, steps=1.088e+08
2023-07-07 12:27:38,276 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 6000, best=0.73, avg=0.72, std=0.00, steps=1.106e+08
2023-07-07 12:27:55,246 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 6100, best=0.73, avg=0.72, std=0.00, steps=1.125e+08
2023-07-07 12:28:12,162 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 6200, best=0.74, avg=0.73, std=0.00, steps=1.143e+08
2023-07-07 12:28:29,060 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 6300, best=0.73, avg=0.73, std=0.00, steps=1.161e+08
2023-07-07 12:28:45,935 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 6400, best=0.73, avg=0.73, std=0.00, steps=1.180e+08
2023-07-07 12:29:02,787 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 6500, best=0.73, avg=0.73, std=0.00, steps=1.198e+08
2023-07-07 12:29:19,662 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 6600, best=0.73, avg=0.73, std=0.00, steps=1.217e+08
2023-07-07 12:29:36,573 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 6700, best=0.73, avg=0.73, std=0.00, steps=1.235e+08
2023-07-07 12:29:53,495 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 6800, best=0.74, avg=0.73, std=0.00, steps=1.254e+08
2023-07-07 12:30:10,375 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 6900, best=0.74, avg=0.73, std=0.00, steps=1.272e+08
2023-07-07 12:30:27,290 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 7000, best=0.74, avg=0.73, std=0.00, steps=1.290e+08
2023-07-07 12:30:44,200 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 7100, best=0.74, avg=0.73, std=0.00, steps=1.309e+08
2023-07-07 12:31:01,096 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 7200, best=0.74, avg=0.73, std=0.00, steps=1.327e+08
2023-07-07 12:31:17,986 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 7300, best=0.74, avg=0.73, std=0.00, steps=1.346e+08
2023-07-07 12:31:34,806 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 7400, best=0.74, avg=0.73, std=0.00, steps=1.364e+08
2023-07-07 12:31:51,693 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 7500, best=0.74, avg=0.73, std=0.00, steps=1.383e+08
2023-07-07 12:32:08,557 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 7600, best=0.74, avg=0.73, std=0.00, steps=1.401e+08
2023-07-07 12:32:25,454 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 7700, best=0.74, avg=0.73, std=0.00, steps=1.419e+08
2023-07-07 12:32:42,313 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 7800, best=0.74, avg=0.73, std=0.00, steps=1.438e+08
2023-07-07 12:32:59,135 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 7900, best=0.74, avg=0.73, std=0.00, steps=1.456e+08
2023-07-07 12:33:16,019 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 8000, best=0.74, avg=0.73, std=0.00, steps=1.475e+08
2023-07-07 12:33:32,942 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 8100, best=0.74, avg=0.73, std=0.00, steps=1.493e+08
2023-07-07 12:33:49,859 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 8200, best=0.74, avg=0.73, std=0.00, steps=1.512e+08
2023-07-07 12:34:06,772 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 8300, best=0.74, avg=0.73, std=0.00, steps=1.530e+08
2023-07-07 12:34:23,591 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 8400, best=0.74, avg=0.73, std=0.00, steps=1.548e+08
2023-07-07 12:34:40,456 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 8500, best=0.74, avg=0.74, std=0.00, steps=1.567e+08
2023-07-07 12:34:57,403 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 8600, best=0.74, avg=0.74, std=0.00, steps=1.585e+08
2023-07-07 12:35:14,285 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 8700, best=0.74, avg=0.74, std=0.00, steps=1.604e+08
2023-07-07 12:35:31,143 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 8800, best=0.74, avg=0.74, std=0.00, steps=1.622e+08
2023-07-07 12:35:48,009 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 8900, best=0.75, avg=0.74, std=0.00, steps=1.641e+08
2023-07-07 12:36:04,868 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 9000, best=0.74, avg=0.74, std=0.00, steps=1.659e+08
2023-07-07 12:36:21,772 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 9100, best=0.74, avg=0.74, std=0.00, steps=1.677e+08
2023-07-07 12:36:38,707 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 9200, best=0.75, avg=0.74, std=0.00, steps=1.696e+08
2023-07-07 12:36:55,637 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 9300, best=0.75, avg=0.74, std=0.00, steps=1.714e+08
2023-07-07 12:37:12,568 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 9400, best=0.75, avg=0.74, std=0.00, steps=1.733e+08
2023-07-07 12:37:29,463 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 9500, best=0.74, avg=0.74, std=0.00, steps=1.751e+08
2023-07-07 12:37:46,298 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 9600, best=0.75, avg=0.74, std=0.00, steps=1.770e+08
2023-07-07 12:38:03,161 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 9700, best=0.75, avg=0.74, std=0.00, steps=1.788e+08
2023-07-07 12:38:20,067 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 9800, best=0.75, avg=0.74, std=0.00, steps=1.807e+08
2023-07-07 12:38:37,009 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 9900, best=0.75, avg=0.74, std=0.00, steps=1.825e+08
2023-07-07 12:38:53,887 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 10000, best=0.75, avg=0.74, std=0.00, steps=1.843e+08
2023-07-07 12:39:10,780 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 10100, best=0.75, avg=0.74, std=0.00, steps=1.862e+08
2023-07-07 12:39:27,614 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 10200, best=0.75, avg=0.74, std=0.00, steps=1.880e+08
2023-07-07 12:39:44,476 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 10300, best=0.75, avg=0.74, std=0.00, steps=1.899e+08
2023-07-07 12:40:01,336 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 10400, best=0.75, avg=0.74, std=0.00, steps=1.917e+08
2023-07-07 12:40:18,214 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 10500, best=0.75, avg=0.74, std=0.00, steps=1.936e+08
2023-07-07 12:40:35,097 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 10600, best=0.75, avg=0.74, std=0.00, steps=1.954e+08
2023-07-07 12:40:52,045 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 10700, best=0.75, avg=0.74, std=0.00, steps=1.972e+08
2023-07-07 12:41:08,935 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 10800, best=0.75, avg=0.74, std=0.00, steps=1.991e+08
2023-07-07 12:41:25,788 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 10900, best=0.75, avg=0.74, std=0.00, steps=2.009e+08
2023-07-07 12:41:42,628 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 11000, best=0.75, avg=0.74, std=0.00, steps=2.028e+08
2023-07-07 12:41:59,569 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 11100, best=0.75, avg=0.74, std=0.00, steps=2.046e+08
2023-07-07 12:42:16,501 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 11200, best=0.75, avg=0.74, std=0.00, steps=2.065e+08
2023-07-07 12:42:33,413 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 11300, best=0.75, avg=0.74, std=0.00, steps=2.083e+08
2023-07-07 12:42:50,280 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 11400, best=0.75, avg=0.75, std=0.00, steps=2.101e+08
2023-07-07 12:43:07,160 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 11500, best=0.75, avg=0.75, std=0.00, steps=2.120e+08
2023-07-07 12:43:24,065 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 11600, best=0.75, avg=0.75, std=0.00, steps=2.138e+08
2023-07-07 12:43:40,989 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 11700, best=0.75, avg=0.75, std=0.00, steps=2.157e+08
2023-07-07 12:43:57,855 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 11800, best=0.76, avg=0.75, std=0.00, steps=2.175e+08
2023-07-07 12:44:14,752 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 11900, best=0.75, avg=0.75, std=0.00, steps=2.194e+08
2023-07-07 12:44:31,543 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 8, 1, [Train]: 11999, best=0.75, avg=0.75, std=0.00, steps=2.212e+08
2023-07-07 12:44:31,544 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 12:44:31,567 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 12:44:31,598 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 12:44:52,196 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 100, best=0.51, avg=0.50, std=0.00, steps=2.068e+06
2023-07-07 12:45:10,860 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 200, best=0.51, avg=0.50, std=0.00, steps=4.116e+06
2023-07-07 12:45:29,566 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 300, best=0.51, avg=0.50, std=0.00, steps=6.164e+06
2023-07-07 12:45:48,212 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 400, best=0.51, avg=0.50, std=0.00, steps=8.212e+06
2023-07-07 12:46:06,884 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 500, best=0.51, avg=0.50, std=0.00, steps=1.026e+07
2023-07-07 12:46:25,564 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 600, best=0.51, avg=0.50, std=0.00, steps=1.231e+07
2023-07-07 12:46:44,228 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 700, best=0.51, avg=0.50, std=0.00, steps=1.436e+07
2023-07-07 12:47:02,904 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 800, best=0.51, avg=0.50, std=0.00, steps=1.640e+07
2023-07-07 12:47:21,612 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 900, best=0.51, avg=0.50, std=0.00, steps=1.845e+07
2023-07-07 12:47:40,295 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 1000, best=0.51, avg=0.50, std=0.00, steps=2.050e+07
2023-07-07 12:47:59,038 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 1100, best=0.51, avg=0.50, std=0.00, steps=2.255e+07
2023-07-07 12:48:17,755 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 1200, best=0.51, avg=0.50, std=0.00, steps=2.460e+07
2023-07-07 12:48:36,494 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 1300, best=0.51, avg=0.50, std=0.00, steps=2.664e+07
2023-07-07 12:48:55,207 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 1400, best=0.51, avg=0.50, std=0.00, steps=2.869e+07
2023-07-07 12:49:14,019 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 1500, best=0.51, avg=0.50, std=0.00, steps=3.074e+07
2023-07-07 12:49:32,720 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 1600, best=0.51, avg=0.50, std=0.00, steps=3.279e+07
2023-07-07 12:49:51,375 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 1700, best=0.51, avg=0.50, std=0.00, steps=3.484e+07
2023-07-07 12:50:10,100 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 1800, best=0.51, avg=0.50, std=0.00, steps=3.688e+07
2023-07-07 12:50:28,914 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 1900, best=0.51, avg=0.50, std=0.00, steps=3.893e+07
2023-07-07 12:50:47,623 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 2000, best=0.51, avg=0.50, std=0.00, steps=4.098e+07
2023-07-07 12:51:06,283 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 2100, best=0.51, avg=0.50, std=0.00, steps=4.303e+07
2023-07-07 12:51:24,976 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 2200, best=0.51, avg=0.50, std=0.00, steps=4.508e+07
2023-07-07 12:51:43,715 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 2300, best=0.51, avg=0.50, std=0.00, steps=4.712e+07
2023-07-07 12:52:02,470 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 2400, best=0.51, avg=0.50, std=0.00, steps=4.917e+07
2023-07-07 12:52:21,206 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 2500, best=0.51, avg=0.50, std=0.00, steps=5.122e+07
2023-07-07 12:52:39,783 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 2600, best=0.51, avg=0.50, std=0.00, steps=5.327e+07
2023-07-07 12:52:58,449 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 2700, best=0.51, avg=0.50, std=0.00, steps=5.532e+07
2023-07-07 12:53:17,051 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 2800, best=0.51, avg=0.50, std=0.00, steps=5.736e+07
2023-07-07 12:53:35,649 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 2900, best=0.51, avg=0.50, std=0.00, steps=5.941e+07
2023-07-07 12:53:54,240 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 3000, best=0.51, avg=0.50, std=0.00, steps=6.146e+07
2023-07-07 12:54:12,976 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 3100, best=0.51, avg=0.50, std=0.00, steps=6.351e+07
2023-07-07 12:54:31,633 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 3200, best=0.51, avg=0.50, std=0.00, steps=6.556e+07
2023-07-07 12:54:50,346 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 3300, best=0.51, avg=0.50, std=0.00, steps=6.760e+07
2023-07-07 12:55:08,992 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 3400, best=0.51, avg=0.50, std=0.00, steps=6.965e+07
2023-07-07 12:55:27,580 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 3500, best=0.51, avg=0.50, std=0.00, steps=7.170e+07
2023-07-07 12:55:46,293 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 3600, best=0.51, avg=0.50, std=0.00, steps=7.375e+07
2023-07-07 12:56:04,978 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 3700, best=0.51, avg=0.50, std=0.00, steps=7.580e+07
2023-07-07 12:56:23,658 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 3800, best=0.51, avg=0.50, std=0.00, steps=7.784e+07
2023-07-07 12:56:42,295 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 3900, best=0.51, avg=0.50, std=0.00, steps=7.989e+07
2023-07-07 12:57:00,933 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 4000, best=0.51, avg=0.50, std=0.00, steps=8.194e+07
2023-07-07 12:57:19,539 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 4100, best=0.51, avg=0.50, std=0.00, steps=8.399e+07
2023-07-07 12:57:38,189 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 4200, best=0.52, avg=0.50, std=0.00, steps=8.604e+07
2023-07-07 12:57:56,815 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 4300, best=0.51, avg=0.50, std=0.00, steps=8.808e+07
2023-07-07 12:58:15,429 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 4400, best=0.51, avg=0.50, std=0.00, steps=9.013e+07
2023-07-07 12:58:34,138 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 4500, best=0.51, avg=0.50, std=0.00, steps=9.218e+07
2023-07-07 12:58:52,726 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 4600, best=0.52, avg=0.50, std=0.00, steps=9.423e+07
2023-07-07 12:59:11,425 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 4700, best=0.51, avg=0.50, std=0.00, steps=9.628e+07
2023-07-07 12:59:30,104 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 4800, best=0.52, avg=0.50, std=0.00, steps=9.832e+07
2023-07-07 12:59:48,748 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 4900, best=0.51, avg=0.50, std=0.00, steps=1.004e+08
2023-07-07 13:00:07,360 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 5000, best=0.51, avg=0.50, std=0.00, steps=1.024e+08
2023-07-07 13:00:25,978 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 5100, best=0.51, avg=0.50, std=0.00, steps=1.045e+08
2023-07-07 13:00:44,600 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 5200, best=0.51, avg=0.50, std=0.00, steps=1.065e+08
2023-07-07 13:01:03,222 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 5300, best=0.51, avg=0.50, std=0.00, steps=1.086e+08
2023-07-07 13:01:21,897 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 5400, best=0.52, avg=0.50, std=0.00, steps=1.106e+08
2023-07-07 13:01:40,560 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 5500, best=0.51, avg=0.50, std=0.00, steps=1.127e+08
2023-07-07 13:01:59,302 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 5600, best=0.51, avg=0.50, std=0.00, steps=1.147e+08
2023-07-07 13:02:17,986 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 5700, best=0.51, avg=0.50, std=0.00, steps=1.168e+08
2023-07-07 13:02:36,598 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 5800, best=0.51, avg=0.50, std=0.00, steps=1.188e+08
2023-07-07 13:02:55,232 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 5900, best=0.51, avg=0.50, std=0.00, steps=1.209e+08
2023-07-07 13:03:13,910 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 6000, best=0.51, avg=0.50, std=0.00, steps=1.229e+08
2023-07-07 13:03:32,550 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 6100, best=0.51, avg=0.50, std=0.00, steps=1.249e+08
2023-07-07 13:03:51,237 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 6200, best=0.51, avg=0.50, std=0.00, steps=1.270e+08
2023-07-07 13:04:09,881 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 6300, best=0.51, avg=0.50, std=0.00, steps=1.290e+08
2023-07-07 13:04:28,468 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 6400, best=0.51, avg=0.50, std=0.00, steps=1.311e+08
2023-07-07 13:04:47,143 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 6500, best=0.51, avg=0.50, std=0.00, steps=1.331e+08
2023-07-07 13:05:05,864 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 6600, best=0.51, avg=0.50, std=0.00, steps=1.352e+08
2023-07-07 13:05:24,549 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 6700, best=0.51, avg=0.50, std=0.00, steps=1.372e+08
2023-07-07 13:05:43,176 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 6800, best=0.51, avg=0.50, std=0.00, steps=1.393e+08
2023-07-07 13:06:01,753 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 6900, best=0.51, avg=0.50, std=0.00, steps=1.413e+08
2023-07-07 13:06:20,396 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 7000, best=0.51, avg=0.50, std=0.00, steps=1.434e+08
2023-07-07 13:06:39,008 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 7100, best=0.51, avg=0.50, std=0.00, steps=1.454e+08
2023-07-07 13:06:57,677 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 7200, best=0.51, avg=0.50, std=0.00, steps=1.475e+08
2023-07-07 13:07:16,311 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 7300, best=0.51, avg=0.50, std=0.00, steps=1.495e+08
2023-07-07 13:07:34,942 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 7400, best=0.51, avg=0.50, std=0.00, steps=1.516e+08
2023-07-07 13:07:53,579 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 7500, best=0.51, avg=0.50, std=0.00, steps=1.536e+08
2023-07-07 13:08:12,282 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 7600, best=0.51, avg=0.50, std=0.00, steps=1.557e+08
2023-07-07 13:08:30,913 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 7700, best=0.51, avg=0.50, std=0.00, steps=1.577e+08
2023-07-07 13:08:49,630 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 7800, best=0.51, avg=0.50, std=0.00, steps=1.598e+08
2023-07-07 13:09:08,348 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 7900, best=0.51, avg=0.50, std=0.00, steps=1.618e+08
2023-07-07 13:09:27,027 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 8000, best=0.51, avg=0.50, std=0.00, steps=1.639e+08
2023-07-07 13:09:45,611 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 8100, best=0.51, avg=0.50, std=0.00, steps=1.659e+08
2023-07-07 13:10:04,225 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 8200, best=0.51, avg=0.50, std=0.00, steps=1.680e+08
2023-07-07 13:10:22,897 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 8300, best=0.51, avg=0.50, std=0.00, steps=1.700e+08
2023-07-07 13:10:41,630 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 8400, best=0.51, avg=0.50, std=0.00, steps=1.721e+08
2023-07-07 13:11:00,332 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 8500, best=0.51, avg=0.50, std=0.00, steps=1.741e+08
2023-07-07 13:11:18,943 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 8600, best=0.51, avg=0.50, std=0.00, steps=1.761e+08
2023-07-07 13:11:37,554 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 8700, best=0.51, avg=0.50, std=0.00, steps=1.782e+08
2023-07-07 13:11:56,165 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 8800, best=0.51, avg=0.50, std=0.00, steps=1.802e+08
2023-07-07 13:12:14,782 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 8900, best=0.51, avg=0.50, std=0.00, steps=1.823e+08
2023-07-07 13:12:33,417 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 9000, best=0.51, avg=0.50, std=0.00, steps=1.843e+08
2023-07-07 13:12:52,024 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 9100, best=0.51, avg=0.50, std=0.00, steps=1.864e+08
2023-07-07 13:13:10,719 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 9200, best=0.51, avg=0.50, std=0.00, steps=1.884e+08
2023-07-07 13:13:29,441 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 9300, best=0.51, avg=0.50, std=0.00, steps=1.905e+08
2023-07-07 13:13:48,041 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 9400, best=0.51, avg=0.50, std=0.00, steps=1.925e+08
2023-07-07 13:14:06,637 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 9500, best=0.51, avg=0.50, std=0.00, steps=1.946e+08
2023-07-07 13:14:25,307 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 9600, best=0.51, avg=0.50, std=0.00, steps=1.966e+08
2023-07-07 13:14:44,017 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 9700, best=0.51, avg=0.50, std=0.00, steps=1.987e+08
2023-07-07 13:15:02,600 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 9800, best=0.51, avg=0.50, std=0.00, steps=2.007e+08
2023-07-07 13:15:21,292 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 9900, best=0.51, avg=0.50, std=0.00, steps=2.028e+08
2023-07-07 13:15:40,029 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 10000, best=0.51, avg=0.50, std=0.00, steps=2.048e+08
2023-07-07 13:15:58,676 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 10100, best=0.51, avg=0.50, std=0.00, steps=2.069e+08
2023-07-07 13:16:17,357 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 10200, best=0.51, avg=0.50, std=0.00, steps=2.089e+08
2023-07-07 13:16:35,961 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 10300, best=0.51, avg=0.50, std=0.00, steps=2.110e+08
2023-07-07 13:16:54,586 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 10400, best=0.51, avg=0.50, std=0.00, steps=2.130e+08
2023-07-07 13:17:13,239 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 10500, best=0.51, avg=0.50, std=0.00, steps=2.151e+08
2023-07-07 13:17:31,880 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 10600, best=0.51, avg=0.50, std=0.00, steps=2.171e+08
2023-07-07 13:17:50,445 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 10700, best=0.51, avg=0.50, std=0.00, steps=2.192e+08
2023-07-07 13:18:09,137 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 10800, best=0.51, avg=0.50, std=0.00, steps=2.212e+08
2023-07-07 13:18:27,775 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 10900, best=0.51, avg=0.50, std=0.00, steps=2.233e+08
2023-07-07 13:18:46,406 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 11000, best=0.51, avg=0.50, std=0.00, steps=2.253e+08
2023-07-07 13:19:05,199 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 11100, best=0.51, avg=0.50, std=0.00, steps=2.273e+08
2023-07-07 13:19:23,959 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 11200, best=0.51, avg=0.50, std=0.00, steps=2.294e+08
2023-07-07 13:19:42,747 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 11300, best=0.51, avg=0.50, std=0.00, steps=2.314e+08
2023-07-07 13:20:01,405 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 11400, best=0.51, avg=0.50, std=0.00, steps=2.335e+08
2023-07-07 13:20:20,047 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 11500, best=0.51, avg=0.50, std=0.00, steps=2.355e+08
2023-07-07 13:20:38,778 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 11600, best=0.51, avg=0.50, std=0.00, steps=2.376e+08
2023-07-07 13:20:57,470 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 11700, best=0.51, avg=0.50, std=0.00, steps=2.396e+08
2023-07-07 13:21:16,225 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 11800, best=0.51, avg=0.50, std=0.00, steps=2.417e+08
2023-07-07 13:21:34,949 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 11900, best=0.51, avg=0.50, std=0.00, steps=2.437e+08
2023-07-07 13:21:53,388 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 16, 1, [Train]: 11999, best=0.51, avg=0.50, std=0.00, steps=2.458e+08
2023-07-07 13:21:53,389 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 13:21:53,413 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 13:21:53,445 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 13:22:17,824 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 100, best=0.51, avg=0.50, std=0.00, steps=2.482e+06
2023-07-07 13:22:40,035 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 200, best=0.51, avg=0.50, std=0.00, steps=4.940e+06
2023-07-07 13:23:02,297 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 300, best=0.51, avg=0.50, std=0.00, steps=7.397e+06
2023-07-07 13:23:24,677 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 400, best=0.56, avg=0.56, std=0.00, steps=9.855e+06
2023-07-07 13:23:46,951 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 500, best=0.58, avg=0.57, std=0.00, steps=1.231e+07
2023-07-07 13:24:09,267 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 600, best=0.59, avg=0.58, std=0.00, steps=1.477e+07
2023-07-07 13:24:31,501 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 700, best=0.60, avg=0.59, std=0.00, steps=1.723e+07
2023-07-07 13:24:53,787 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 800, best=0.60, avg=0.59, std=0.00, steps=1.969e+07
2023-07-07 13:25:16,083 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 900, best=0.61, avg=0.60, std=0.00, steps=2.214e+07
2023-07-07 13:25:38,469 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 1000, best=0.62, avg=0.61, std=0.00, steps=2.460e+07
2023-07-07 13:26:00,719 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 1100, best=0.62, avg=0.61, std=0.00, steps=2.706e+07
2023-07-07 13:26:22,990 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 1200, best=0.62, avg=0.62, std=0.00, steps=2.952e+07
2023-07-07 13:26:45,357 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 1300, best=0.63, avg=0.62, std=0.00, steps=3.197e+07
2023-07-07 13:27:07,690 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 1400, best=0.63, avg=0.63, std=0.00, steps=3.443e+07
2023-07-07 13:27:29,981 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 1500, best=0.64, avg=0.63, std=0.00, steps=3.689e+07
2023-07-07 13:27:52,318 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 1600, best=0.64, avg=0.63, std=0.00, steps=3.935e+07
2023-07-07 13:28:14,606 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 1700, best=0.64, avg=0.63, std=0.00, steps=4.180e+07
2023-07-07 13:28:36,941 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 1800, best=0.64, avg=0.63, std=0.00, steps=4.426e+07
2023-07-07 13:28:59,277 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 1900, best=0.64, avg=0.64, std=0.00, steps=4.672e+07
2023-07-07 13:29:21,621 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 2000, best=0.64, avg=0.64, std=0.00, steps=4.918e+07
2023-07-07 13:29:43,937 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 2100, best=0.64, avg=0.64, std=0.00, steps=5.163e+07
2023-07-07 13:30:06,248 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 2200, best=0.65, avg=0.64, std=0.00, steps=5.409e+07
2023-07-07 13:30:28,528 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 2300, best=0.65, avg=0.64, std=0.00, steps=5.655e+07
2023-07-07 13:30:50,837 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 2400, best=0.65, avg=0.64, std=0.00, steps=5.901e+07
2023-07-07 13:31:13,110 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 2500, best=0.65, avg=0.64, std=0.00, steps=6.146e+07
2023-07-07 13:31:35,405 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 2600, best=0.65, avg=0.64, std=0.00, steps=6.392e+07
2023-07-07 13:31:57,765 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 2700, best=0.65, avg=0.64, std=0.00, steps=6.638e+07
2023-07-07 13:32:20,025 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 2800, best=0.65, avg=0.64, std=0.00, steps=6.884e+07
2023-07-07 13:32:42,308 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 2900, best=0.65, avg=0.64, std=0.00, steps=7.129e+07
2023-07-07 13:33:04,518 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 3000, best=0.65, avg=0.64, std=0.00, steps=7.375e+07
2023-07-07 13:33:26,769 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 3100, best=0.65, avg=0.64, std=0.00, steps=7.621e+07
2023-07-07 13:33:49,112 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 3200, best=0.65, avg=0.65, std=0.00, steps=7.867e+07
2023-07-07 13:34:11,354 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 3300, best=0.65, avg=0.65, std=0.00, steps=8.113e+07
2023-07-07 13:34:33,633 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 3400, best=0.65, avg=0.65, std=0.00, steps=8.358e+07
2023-07-07 13:34:55,914 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 3500, best=0.65, avg=0.65, std=0.00, steps=8.604e+07
2023-07-07 13:35:18,158 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 3600, best=0.65, avg=0.65, std=0.00, steps=8.850e+07
2023-07-07 13:35:40,436 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 3700, best=0.65, avg=0.65, std=0.00, steps=9.096e+07
2023-07-07 13:36:02,888 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 3800, best=0.65, avg=0.65, std=0.00, steps=9.341e+07
2023-07-07 13:36:25,172 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 3900, best=0.65, avg=0.65, std=0.00, steps=9.587e+07
2023-07-07 13:36:47,496 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 4000, best=0.66, avg=0.65, std=0.00, steps=9.833e+07
2023-07-07 13:37:09,832 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 4100, best=0.65, avg=0.65, std=0.00, steps=1.008e+08
2023-07-07 13:37:32,166 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 4200, best=0.66, avg=0.65, std=0.00, steps=1.032e+08
2023-07-07 13:37:54,554 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 4300, best=0.66, avg=0.65, std=0.00, steps=1.057e+08
2023-07-07 13:38:16,840 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 4400, best=0.66, avg=0.65, std=0.00, steps=1.082e+08
2023-07-07 13:38:39,172 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 4500, best=0.66, avg=0.65, std=0.00, steps=1.106e+08
2023-07-07 13:39:01,497 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 4600, best=0.66, avg=0.65, std=0.00, steps=1.131e+08
2023-07-07 13:39:23,829 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 4700, best=0.66, avg=0.65, std=0.00, steps=1.155e+08
2023-07-07 13:39:46,102 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 4800, best=0.66, avg=0.65, std=0.00, steps=1.180e+08
2023-07-07 13:40:08,335 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 4900, best=0.66, avg=0.65, std=0.00, steps=1.204e+08
2023-07-07 13:40:30,605 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 5000, best=0.66, avg=0.65, std=0.00, steps=1.229e+08
2023-07-07 13:40:52,856 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 5100, best=0.66, avg=0.65, std=0.00, steps=1.254e+08
2023-07-07 13:41:15,030 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 5200, best=0.66, avg=0.65, std=0.00, steps=1.278e+08
2023-07-07 13:41:37,334 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 5300, best=0.66, avg=0.65, std=0.00, steps=1.303e+08
2023-07-07 13:41:59,582 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 5400, best=0.66, avg=0.65, std=0.00, steps=1.327e+08
2023-07-07 13:42:21,888 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 5500, best=0.66, avg=0.65, std=0.00, steps=1.352e+08
2023-07-07 13:42:44,145 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 5600, best=0.66, avg=0.65, std=0.00, steps=1.377e+08
2023-07-07 13:43:06,371 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 5700, best=0.66, avg=0.65, std=0.00, steps=1.401e+08
2023-07-07 13:43:28,604 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 5800, best=0.66, avg=0.65, std=0.00, steps=1.426e+08
2023-07-07 13:43:50,875 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 5900, best=0.66, avg=0.65, std=0.00, steps=1.450e+08
2023-07-07 13:44:13,128 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 6000, best=0.66, avg=0.65, std=0.00, steps=1.475e+08
2023-07-07 13:44:35,363 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 6100, best=0.66, avg=0.65, std=0.00, steps=1.499e+08
2023-07-07 13:44:57,568 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 6200, best=0.66, avg=0.66, std=0.00, steps=1.524e+08
2023-07-07 13:45:19,840 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 6300, best=0.66, avg=0.66, std=0.00, steps=1.549e+08
2023-07-07 13:45:42,110 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 6400, best=0.66, avg=0.65, std=0.00, steps=1.573e+08
2023-07-07 13:46:04,359 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 6500, best=0.66, avg=0.66, std=0.00, steps=1.598e+08
2023-07-07 13:46:26,589 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 6600, best=0.66, avg=0.66, std=0.00, steps=1.622e+08
2023-07-07 13:46:48,812 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 6700, best=0.67, avg=0.66, std=0.00, steps=1.647e+08
2023-07-07 13:47:11,023 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 6800, best=0.66, avg=0.66, std=0.00, steps=1.671e+08
2023-07-07 13:47:33,300 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 6900, best=0.66, avg=0.66, std=0.00, steps=1.696e+08
2023-07-07 13:47:55,491 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 7000, best=0.67, avg=0.66, std=0.00, steps=1.721e+08
2023-07-07 13:48:17,832 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 7100, best=0.67, avg=0.66, std=0.00, steps=1.745e+08
2023-07-07 13:48:40,048 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 7200, best=0.67, avg=0.66, std=0.00, steps=1.770e+08
2023-07-07 13:49:02,274 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 7300, best=0.67, avg=0.66, std=0.00, steps=1.794e+08
2023-07-07 13:49:24,513 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 7400, best=0.67, avg=0.66, std=0.00, steps=1.819e+08
2023-07-07 13:49:46,736 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 7500, best=0.67, avg=0.66, std=0.00, steps=1.843e+08
2023-07-07 13:50:09,029 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 7600, best=0.67, avg=0.66, std=0.00, steps=1.868e+08
2023-07-07 13:50:31,227 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 7700, best=0.67, avg=0.66, std=0.00, steps=1.893e+08
2023-07-07 13:50:53,550 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 7800, best=0.67, avg=0.66, std=0.00, steps=1.917e+08
2023-07-07 13:51:15,858 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 7900, best=0.67, avg=0.66, std=0.00, steps=1.942e+08
2023-07-07 13:51:38,144 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 8000, best=0.67, avg=0.66, std=0.00, steps=1.966e+08
2023-07-07 13:52:00,348 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 8100, best=0.67, avg=0.67, std=0.00, steps=1.991e+08
2023-07-07 13:52:22,625 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 8200, best=0.67, avg=0.67, std=0.00, steps=2.015e+08
2023-07-07 13:52:44,871 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 8300, best=0.67, avg=0.67, std=0.00, steps=2.040e+08
2023-07-07 13:53:07,206 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 8400, best=0.67, avg=0.67, std=0.00, steps=2.065e+08
2023-07-07 13:53:29,577 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 8500, best=0.67, avg=0.67, std=0.00, steps=2.089e+08
2023-07-07 13:53:51,875 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 8600, best=0.67, avg=0.67, std=0.00, steps=2.114e+08
2023-07-07 13:54:14,112 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 8700, best=0.67, avg=0.67, std=0.00, steps=2.138e+08
2023-07-07 13:54:36,371 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 8800, best=0.67, avg=0.67, std=0.00, steps=2.163e+08
2023-07-07 13:54:58,641 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 8900, best=0.67, avg=0.67, std=0.00, steps=2.188e+08
2023-07-07 13:55:20,967 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 9000, best=0.67, avg=0.67, std=0.00, steps=2.212e+08
2023-07-07 13:55:43,256 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 9100, best=0.68, avg=0.67, std=0.00, steps=2.237e+08
2023-07-07 13:56:05,526 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 9200, best=0.68, avg=0.67, std=0.00, steps=2.261e+08
2023-07-07 13:56:27,811 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 9300, best=0.68, avg=0.67, std=0.00, steps=2.286e+08
2023-07-07 13:56:50,128 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 9400, best=0.68, avg=0.67, std=0.00, steps=2.310e+08
2023-07-07 13:57:12,398 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 9500, best=0.67, avg=0.67, std=0.00, steps=2.335e+08
2023-07-07 13:57:34,629 -        meta learning: [    INFO] - [Len Lat Rep]: 32, 32, 1, [Train]: 9600, best=0.68, avg=0.67, std=0.00, steps=2.360e+08
2023-07-07 13:57:37,422 -        meta learning: [    INFO] - KeyboardInterrupt, Begin eval_with_injury.
2023-07-07 13:57:37,422 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 13:57:37,423 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 13:57:37,513 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 13:57:37,549 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 13:57:47,854 -        meta learning: [    INFO] - KeyboardInterrupt, Begin eval_with_injury.
2023-07-07 13:57:47,854 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 13:57:47,854 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 13:57:47,955 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 13:57:47,986 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 13:57:49,062 -        meta learning: [    INFO] - KeyboardInterrupt, Begin eval_with_injury.
2023-07-07 13:57:49,062 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 13:57:49,062 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 13:57:49,162 -        meta learning: [    INFO] - [Total Params]: params=53505
2023-07-07 13:57:49,191 -           SimManager: [    INFO] - use_for_loop=False
2023-07-07 13:57:49,387 -        meta learning: [    INFO] - KeyboardInterrupt, Begin eval_with_injury.
2023-07-07 13:57:49,388 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 13:57:49,388 -        meta learning: [    INFO] - [OUTPUT DIR]: /data/anonymous/meta/train/PGPE-BatchedGruMetaStdpMLPPolicy-SeqTask--20230707-000444
2023-07-07 13:57:49,411 -        meta learning: [    INFO] - [Total Params]: params=53505
