action: tensor([[-0.9952, -0.9655, -0.9626,  0.8935,  0.9897,  0.4982],
        [-0.9529, -0.9966, -0.9669, -0.8103,  0.9665,  0.3314],
        [ 0.4424,  0.2325, -0.7148, -0.1693,  0.8153, -0.4666],
        [ 0.9817,  0.6760,  0.9992,  0.1840, -0.9534, -0.1046],
        [ 0.9838,  0.7855,  0.8100,  0.2174, -0.9802, -0.7852],
        [ 0.9658,  0.3667, -0.9223,  0.9075, -0.9399,  0.1530],
        [-0.9982, -0.9712, -0.9573,  0.8343,  0.9489,  0.9477],
        [-0.9358, -0.9859, -0.9657, -0.3485,  0.7070,  0.6502],
        [ 0.5042,  0.8155, -0.8856, -0.3878,  0.3853, -0.4317],
        [ 0.9158, -0.3290,  0.9648,  0.5092, -0.8433,  0.0168],
        [ 0.9362, -0.2846,  0.9048,  0.9617, -0.4950,  0.3404],
        [ 0.9411, -0.9373, -0.9672,  0.9078, -0.8657, -0.9675],
        [-0.9797, -0.6337, -0.9059,  0.7984,  0.9788, -0.7475],
        [-0.9731, -0.9889, -0.9608, -0.9317,  0.9518,  0.4996],
        [ 0.4194,  0.8417, -0.8405, -0.5234, -0.2991, -0.2471],
        [ 0.9701,  0.3364,  0.9577,  0.1409, -0.9378, -0.8648],
        [ 0.9894,  0.6893,  0.6421,  0.3486, -0.9741, -0.9036],
        [ 0.9865,  0.2370, -0.8292,  0.8871, -0.9580,  0.2479],
        [-0.9970, -0.9657, -0.9788,  0.9769,  0.9960,  0.9931],
        [-0.9793, -0.9545, -0.9799,  0.1075,  0.9170,  0.2914]],
       device='cuda:0')
squash tensor([[-3.0145, -2.0206, -1.9795,  1.4391,  2.6334,  0.5469],
        [-1.8629, -3.1834, -2.0420, -1.1278,  2.0358,  0.3444],
        [ 0.4752,  0.2368, -0.8969, -0.1709,  1.1426, -0.5058],
        [ 2.3420,  0.8218,  3.8949,  0.1861, -1.8674, -0.1050],
        [ 2.4052,  1.0595,  1.1271,  0.2209, -2.3038, -1.0589],
        [ 2.0257,  0.3846, -1.6044,  1.5131, -1.7368,  0.1542],
        [-3.5166, -2.1133, -1.9127,  1.2021,  1.8204,  1.8091],
        [-1.7030, -2.4746, -2.0237, -0.3637,  0.8811,  0.7756],
        [ 0.5550,  1.1432, -1.4013, -0.4092,  0.4062, -0.4620],
        [ 1.5622, -0.3417,  2.0117,  0.5617, -1.2325,  0.0168],
        [ 1.7063, -0.2927,  1.4979,  1.9682, -0.5427,  0.3545],
        [ 1.7479, -1.7157, -2.0469,  1.5150, -1.3158, -2.0523],
        [-2.2903, -0.7475, -1.5040,  1.0942,  2.2677, -0.9673],
        [-2.1480, -2.5956, -1.9558, -1.6713,  1.8508,  0.5488],
        [ 0.4469,  1.2269, -1.2230, -0.5810, -0.3085, -0.2523],
        [ 2.0939,  0.3501,  1.9173,  0.1418, -1.7191, -1.3119],
        [ 2.6166,  0.8466,  0.7617,  0.3639, -2.1670, -1.4917],
        [ 2.4941,  0.2416, -1.1855,  1.4082, -1.9211,  0.2531],
        [-3.2459, -2.0245, -2.2683,  2.2256,  3.1043,  2.8321],
        [-2.2793, -1.8806, -2.2946,  0.1079,  1.5697,  0.3001]],
       device='cuda:0')
action: tensor([[ 9.2862e-01,  8.1047e-01, -9.6914e-01, -9.1682e-01,  3.4846e-01,
          5.0503e-01],
        [ 9.0951e-01, -1.7296e-02,  9.9461e-01,  7.0753e-01, -1.0791e-01,
          3.2341e-01],
        [-2.9983e-01, -5.1859e-01,  7.6446e-01,  8.1070e-01, -3.1567e-03,
          6.1421e-01],
        [ 9.0073e-01,  1.7099e-01, -2.3533e-02,  8.6069e-03, -4.4709e-01,
         -3.3660e-01],
        [-5.9046e-01, -5.1693e-01, -8.9520e-01, -5.4101e-04, -1.8708e-01,
         -7.0680e-01],
        [-7.4135e-01, -7.0066e-01, -9.4449e-01, -3.6793e-01,  1.5372e-01,
         -2.9188e-01],
        [ 2.9486e-01,  9.8749e-01, -9.9589e-01, -9.6457e-01, -3.6004e-01,
          4.1346e-01],
        [ 2.0466e-01, -1.9773e-01,  9.9145e-01, -9.7322e-01, -8.2212e-01,
         -8.9141e-01],
        [ 6.9215e-01, -5.4785e-01, -7.7336e-01,  7.7632e-01,  6.9353e-01,
          7.7367e-01],
        [-8.3030e-01, -6.7741e-01, -9.1433e-01,  9.2744e-01, -2.6061e-01,
          9.4038e-01],
        [-9.7609e-01, -9.8738e-01, -9.6481e-01, -4.8051e-02,  9.9488e-01,
          9.6681e-01],
        [-9.8531e-01, -7.4357e-01, -8.9754e-01,  7.7344e-01,  9.3059e-01,
          7.6417e-01],
        [ 9.8994e-01, -7.7776e-01,  9.7581e-01,  9.3832e-01,  9.5015e-01,
          2.4092e-01],
        [ 9.6450e-01, -2.6145e-01,  9.8888e-01,  6.9659e-01, -7.5283e-01,
         -5.9673e-01],
        [ 9.8008e-01, -3.2705e-01,  9.7798e-01, -1.4749e-01, -9.1094e-01,
         -4.6283e-01],
        [ 9.6691e-01,  6.9837e-01,  9.4958e-01,  3.1683e-01, -8.8000e-01,
         -6.6740e-01],
        [ 9.7726e-01,  1.1095e-01, -1.4490e-01, -1.7078e-01, -9.7498e-01,
         -9.3823e-01],
        [-9.6686e-01, -9.6222e-01, -9.9692e-01,  3.5708e-01,  9.4135e-01,
          2.3846e-01],
        [-9.4133e-01, -9.9632e-01, -9.6462e-01, -7.6663e-01,  9.0343e-01,
          3.2849e-01],
        [ 9.5227e-01,  5.6724e-01, -5.2485e-01, -1.6933e-01,  6.7521e-01,
          5.1212e-01]], device='cuda:0')
squash tensor([[ 1.6482e+00,  1.1284e+00, -2.0779e+00, -1.5687e+00,  3.6369e-01,
          5.5604e-01],
        [ 1.5247e+00, -1.7298e-02,  2.9569e+00,  8.8223e-01, -1.0833e-01,
          3.3545e-01],
        [-3.0934e-01, -5.7441e-01,  1.0069e+00,  1.1291e+00, -3.1567e-03,
          7.1566e-01],
        [ 1.4761e+00,  1.7269e-01, -2.3538e-02,  8.6071e-03, -4.8106e-01,
         -3.5025e-01],
        [-6.7838e-01, -5.7214e-01, -1.4475e+00, -5.4101e-04, -1.8931e-01,
         -8.8077e-01],
        [-9.5348e-01, -8.6860e-01, -1.7781e+00, -3.8603e-01,  1.5495e-01,
         -3.0062e-01],
        [ 3.0389e-01,  2.5340e+00, -3.0922e+00, -2.0077e+00, -3.7693e-01,
          4.3977e-01],
        [ 2.0759e-01, -2.0037e-01,  2.7254e+00, -2.1499e+00, -1.1633e+00,
         -1.4288e+00],
        [ 8.5207e-01, -6.1530e-01, -1.0286e+00,  1.0360e+00,  8.5472e-01,
          1.0294e+00],
        [-1.1891e+00, -8.2432e-01, -1.5533e+00,  1.6398e+00, -2.6677e-01,
          1.7413e+00],
        [-2.2074e+00, -2.5297e+00, -2.0111e+00, -4.8088e-02,  2.9825e+00,
          2.0409e+00],
        [-2.4533e+00, -9.5843e-01, -1.4594e+00,  1.0288e+00,  1.6628e+00,
          1.0062e+00],
        [ 2.6434e+00, -1.0397e+00,  2.2013e+00,  1.7238e+00,  1.8333e+00,
          2.4575e-01],
        [ 2.0067e+00, -2.6766e-01,  2.5931e+00,  8.6064e-01, -9.7945e-01,
         -6.8806e-01],
        [ 2.2995e+00, -3.3952e-01,  2.2490e+00, -1.4857e-01, -1.5330e+00,
         -5.0090e-01],
        [ 2.0425e+00,  8.6411e-01,  1.8275e+00,  3.2812e-01, -1.3758e+00,
         -8.0605e-01],
        [ 2.2326e+00,  1.1141e-01, -1.4593e-01, -1.7247e-01, -2.1843e+00,
         -1.7230e+00],
        [-2.0418e+00, -1.9750e+00, -3.2373e+00,  3.7354e-01,  1.7498e+00,
          2.4314e-01],
        [-1.7496e+00, -3.1476e+00, -2.0084e+00, -1.0121e+00,  1.4906e+00,
          3.4113e-01],
        [ 1.8556e+00,  6.4345e-01, -5.8302e-01, -1.7097e-01,  8.2026e-01,
          5.6559e-01]], device='cuda:0')
action: tensor([[ 0.9856, -0.4953,  0.9875, -0.0501, -0.5293, -0.5696],
        [ 0.9684, -0.0466,  0.9601, -0.5343, -0.9781, -0.9197],
        [ 0.9973,  0.2358,  0.9374,  0.2169, -0.9257, -0.9011],
        [ 0.9870,  0.4023, -0.3531,  0.3074, -0.9667, -0.1776],
        [-0.9516, -0.9729, -0.9013,  0.2574,  0.9730,  0.9235],
        [-0.9904, -0.9569, -0.9759, -0.5269,  0.9827,  0.9355],
        [ 0.9196,  0.4995, -0.3763,  0.0025,  0.8662,  0.7291],
        [ 0.9864, -0.8620,  0.9513,  0.5159, -0.8710,  0.7753],
        [ 0.9975, -0.6361,  0.9678,  0.9220, -0.8164, -0.5869],
        [ 0.8958, -0.9614, -0.8199,  0.9725, -0.6067, -0.9131],
        [-0.9919, -0.9962, -0.9398,  0.8059,  0.9524, -0.9104],
        [-0.9473, -0.9783, -0.9804, -0.8430,  0.9737,  0.8916],
        [ 0.1383,  0.9557, -0.9693, -0.8812, -0.7334, -0.1307],
        [ 0.9831,  0.6930,  0.8873,  0.1295, -0.4409,  0.6737],
        [-0.7312, -0.5431,  0.5742,  0.8335, -0.7450, -0.4806],
        [-0.7360,  0.7113, -0.5454, -0.5376, -0.4580,  0.1671],
        [ 0.8515,  0.5542, -0.8767, -0.9017, -0.8687, -0.8999],
        [ 0.9949, -0.8082,  0.9918, -0.8622, -0.9853, -0.8966],
        [ 0.9110, -0.9592, -0.5766,  0.7406, -0.9950, -0.6994],
        [-0.9988, -0.9307, -0.9696,  0.4341,  0.9824,  0.5838]],
       device='cuda:0')
squash tensor([[ 2.4634e+00, -5.4306e-01,  2.5360e+00, -5.0172e-02, -5.8917e-01,
         -6.4688e-01],
        [ 2.0661e+00, -4.6682e-02,  1.9467e+00, -5.9618e-01, -2.2517e+00,
         -1.5873e+00],
        [ 3.2953e+00,  2.4036e-01,  1.7166e+00,  2.2039e-01, -1.6276e+00,
         -1.4782e+00],
        [ 2.5129e+00,  4.2641e-01, -3.6898e-01,  3.1769e-01, -2.0396e+00,
         -1.7949e-01],
        [-1.8489e+00, -2.1431e+00, -1.4790e+00,  2.6329e-01,  2.1462e+00,
          1.6122e+00],
        [-2.6681e+00, -1.9074e+00, -2.2030e+00, -5.8585e-01,  2.3704e+00,
          1.7006e+00],
        [ 1.5863e+00,  5.4857e-01, -3.9571e-01,  2.5145e-03,  1.3176e+00,
          9.2671e-01],
        [ 2.4922e+00, -1.3009e+00,  1.8456e+00,  5.7072e-01, -1.3371e+00,
          1.0334e+00],
        [ 3.3371e+00, -7.5162e-01,  2.0564e+00,  1.6020e+00, -1.1460e+00,
         -6.7298e-01],
        [ 1.4503e+00, -1.9646e+00, -1.1564e+00,  2.1365e+00, -7.0363e-01,
         -1.5459e+00],
        [-2.7523e+00, -3.1274e+00, -1.7360e+00,  1.1152e+00,  1.8569e+00,
         -1.5298e+00],
        [-1.8044e+00, -2.2559e+00, -2.3080e+00, -1.2316e+00,  2.1587e+00,
          1.4296e+00],
        [ 1.3916e-01,  1.8941e+00, -2.0798e+00, -1.3810e+00, -9.3595e-01,
         -1.3141e-01],
        [ 2.3820e+00,  8.5366e-01,  1.4089e+00,  1.3027e-01, -4.7336e-01,
          8.1744e-01],
        [-9.3140e-01, -6.0860e-01,  6.5379e-01,  1.1995e+00, -9.6165e-01,
         -5.2372e-01],
        [-9.4176e-01,  8.8988e-01, -6.1187e-01, -6.0076e-01, -4.9480e-01,
          1.6869e-01],
        [ 1.2615e+00,  6.2444e-01, -1.3612e+00, -1.4813e+00, -1.3278e+00,
         -1.4719e+00],
        [ 2.9848e+00, -1.1218e+00,  2.7490e+00, -1.3020e+00, -2.4545e+00,
         -1.4546e+00],
        [ 1.5334e+00, -1.9361e+00, -6.5728e-01,  9.5185e-01, -2.9952e+00,
         -8.6610e-01],
        [-3.7142e+00, -1.6637e+00, -2.0857e+00,  4.6494e-01,  2.3634e+00,
          6.6814e-01]], device='cuda:0')
action: tensor([[ 0.9901,  0.3219,  0.9959, -0.5777, -0.8720,  0.0111],
        [ 0.9367,  0.6542,  0.9337,  0.3677, -0.9339, -0.9006],
        [ 0.9888,  0.4003, -0.9188,  0.2829, -0.9671, -0.9250],
        [-0.9832, -0.8741, -0.9707,  0.1253,  0.9710,  0.5145],
        [-0.9849, -0.9773, -0.9815, -0.5212,  0.9798,  0.9850],
        [ 0.8788, -0.1391, -0.4421,  0.5030,  0.7458,  0.9157],
        [ 0.9771,  0.3853,  0.9940,  0.1528, -0.9780, -0.8824],
        [ 0.9947, -0.5258,  0.9634,  0.1737, -0.9039, -0.7024],
        [ 0.8013, -0.2195, -0.6278,  0.9713, -0.9859, -0.3780],
        [-0.9915, -0.6993, -0.8990,  0.7862,  0.8725,  0.8413],
        [-0.9353, -0.9951, -0.9896, -0.7465,  0.9935,  0.8822],
        [ 0.9191,  0.6625, -0.7942, -0.0134,  0.8188,  0.4867],
        [ 0.9719,  0.1877,  0.9852,  0.6378, -0.9699, -0.4257],
        [ 0.9846,  0.6466,  0.9697,  0.2513, -0.9241, -0.9754],
        [ 0.9195,  0.3253,  0.1274,  0.8753, -0.9710,  0.2222],
        [-0.9891, -0.9849, -0.9918,  0.9475,  0.9775,  0.7545],
        [-0.9640, -0.9839, -0.9788, -0.1788,  0.9642,  0.9759],
        [ 0.8333,  0.7403, -0.7682, -0.6132,  0.5904,  0.7744],
        [ 0.8378, -0.6651,  0.9647,  0.7763, -0.2477,  0.4310],
        [ 0.9941, -0.3230,  0.9736,  0.3235, -0.9587, -0.8639]],
       device='cuda:0')
squash tensor([[ 2.6529,  0.3338,  3.0943, -0.6590, -1.3412,  0.0111],
        [ 1.7105,  0.7827,  1.6862,  0.3857, -1.6878, -1.4754],
        [ 2.5903,  0.4240, -1.5812,  0.2909, -2.0458, -1.6228],
        [-2.3852, -1.3501, -2.1041,  0.1259,  2.1102,  0.5688],
        [-2.4409, -2.2330, -2.3368, -0.5780,  2.2921,  2.4418],
        [ 1.3703, -0.1400, -0.4748,  0.5533,  0.9635,  1.5620],
        [ 2.2288,  0.4063,  2.9033,  0.1540, -2.2499, -1.3866],
        [ 2.9685, -0.5844,  1.9918,  0.1755, -1.4932, -0.8721],
        [ 1.1022, -0.2232, -0.7378,  2.1150, -2.4740, -0.3977],
        [-2.7305, -0.8660, -1.4669,  1.0613,  1.3434,  1.2255],
        [-1.6989, -3.0040, -2.6259, -0.9649,  2.8607,  1.3857],
        [ 1.5834,  0.7972, -1.0827, -0.0134,  1.1532,  0.5317],
        [ 2.1257,  0.1900,  2.4484,  0.7544, -2.0906, -0.4546],
        [ 2.4281,  0.7694,  2.0881,  0.2568, -1.6162, -2.1921],
        [ 1.5859,  0.3375,  0.1281,  1.3552, -2.1100,  0.2260],
        [-2.6015, -2.4395, -2.7445,  1.8066,  2.2383,  0.9834],
        [-1.9993, -2.4063, -2.2679, -0.1807,  2.0023,  2.2043],
        [ 1.1990,  0.9511, -1.0159, -0.7140,  0.6783,  1.0311],
        [ 1.2138, -0.8019,  2.0101,  1.0360, -0.2530,  0.4611],
        [ 2.9091, -0.3350,  2.1563,  0.3356, -1.9300, -1.3085]],
       device='cuda:0')
action: tensor([[ 0.9712,  0.2881, -0.8640,  0.7541, -0.9455,  0.3082],
        [-0.9967, -0.9814, -0.9730,  0.8802,  0.9784,  0.9834],
        [-0.9450, -0.8892, -0.7448,  0.0600,  0.9783,  0.6240],
        [ 0.3694, -0.9325,  0.1987,  0.5409,  0.7457, -0.0642],
        [-0.4781, -0.0132,  0.8789,  0.8211, -0.9205,  0.9982],
        [-0.9726,  0.8176, -0.9908, -0.9710, -0.4677, -0.9010],
        [ 0.4995,  0.6477, -0.9838, -0.6948,  0.2657,  0.9558],
        [ 0.9969, -0.7977,  0.9734, -0.9768, -0.9799, -0.9706],
        [ 0.9999,  0.9076, -0.2806,  0.7769, -0.9968, -0.9668],
        [-0.9655, -0.8716, -0.9888, -0.2004,  0.9897,  0.7838],
        [-0.9518, -0.9654, -0.8383, -0.4969,  0.9748,  0.9460],
        [ 0.9246,  0.4468, -0.7297,  0.2291,  0.7314,  0.2159],
        [ 0.9872, -0.6520,  0.9922,  0.3979, -0.8765, -0.8875],
        [ 0.9949,  0.6992,  0.9600,  0.5885, -0.9957, -0.6712],
        [ 0.9915,  0.5690, -0.3671,  0.9620, -0.9236, -0.1337],
        [-0.9987, -0.8504, -0.9780,  0.8753,  0.9891,  0.9318],
        [-0.9585, -0.9759, -0.9638, -0.1958,  0.9861,  0.9837],
        [ 0.8918,  0.2370, -0.4328,  0.8209,  0.8997,  0.6263],
        [ 0.9987, -0.2823,  0.9593,  0.4229, -0.8810, -0.7593],
        [ 0.9479, -0.4464,  0.9918, -0.0336, -0.7862, -0.6450]],
       device='cuda:0')
squash tensor([[ 2.1135,  0.2965, -1.3091,  0.9823, -1.7877,  0.3186],
        [-3.1970, -2.3343, -2.1450,  1.3766,  2.2579,  2.3902],
        [-1.7827, -1.4183, -0.9612,  0.0600,  2.2560,  0.7315],
        [ 0.3877, -1.6769,  0.2014,  0.6054,  0.9632, -0.0643],
        [-0.5205, -0.0132,  1.3711,  1.1601, -1.5923,  3.5137],
        [-2.1382,  1.1495, -2.6903, -2.1101, -0.5072, -1.4775],
        [ 0.5486,  0.7713, -2.4038, -0.8572,  0.2723,  1.8944],
        [ 3.2300, -1.0922,  2.1529, -2.2231, -2.2959, -2.1033],
        [ 4.9881,  1.5136, -0.2883,  1.0374, -3.2104, -2.0414],
        [-2.0213, -1.3397, -2.5916, -0.2032,  2.6340,  1.0550],
        [-1.8503, -2.0202, -1.2153, -0.5451,  2.1806,  1.7921],
        [ 1.6198,  0.4807, -0.9281,  0.2332,  0.9317,  0.2194],
        [ 2.5210, -0.7788,  2.7742,  0.4212, -1.3604, -1.4101],
        [ 2.9869,  0.8658,  1.9461,  0.6754, -3.0672, -0.8128],
        [ 2.7300,  0.6461, -0.3850,  1.9723, -1.6130, -0.1345],
        [-3.6690, -1.2576, -2.2496,  1.3552,  2.6053,  1.6715],
        [-1.9272, -2.2036, -1.9965, -0.1984,  2.4796,  2.4017],
        [ 1.4307,  0.2416, -0.4633,  1.1596,  1.4704,  0.7354],
        [ 3.6523, -0.2902,  1.9376,  0.4513, -1.3801, -0.9945],
        [ 1.8110, -0.4801,  2.7472, -0.0336, -1.0615, -0.7667]],
       device='cuda:0')
action: tensor([[ 0.4625, -0.9573, -0.9612,  0.9982, -0.8200, -0.9520],
        [-0.9952, -0.9553, -0.9422,  0.9757,  0.9824,  0.8253],
        [-0.9821, -0.9912, -0.9377, -0.8695,  0.9697,  0.6780],
        [ 0.1050,  0.8256, -0.9788, -0.7777, -0.4583, -0.3143],
        [ 0.9351,  0.7222,  0.9559,  0.7788, -0.8128,  0.6330],
        [ 0.9384, -0.1852,  0.9702,  0.8790, -0.8975, -0.6122],
        [ 0.9884, -0.8545, -0.8687,  0.9792, -0.9713, -0.9720],
        [-0.9604, -0.9458, -0.9332,  0.4852,  0.9087, -0.8301],
        [-0.8793, -0.9264, -0.9396, -0.8058,  0.8434,  0.8683],
        [ 0.3568,  0.7877, -0.9752, -0.7230,  0.2889,  0.4784],
        [ 0.9968, -0.1964,  0.9407,  0.3717, -0.8181, -0.7666],
        [ 0.9709,  0.2015,  0.9804,  0.2614, -0.8883, -0.5964],
        [ 0.9892,  0.5094, -0.2262,  0.8307, -0.9549, -0.7508],
        [-0.9959, -0.9826, -0.9178,  0.5124,  0.9283,  0.4207],
        [-0.9017, -0.7955, -0.9845, -0.4914,  0.9729,  0.6790],
        [ 0.9741,  0.5949, -0.6608, -0.1327,  0.8978, -0.6007],
        [ 0.9970, -0.4764,  0.9995,  0.2347, -0.9207, -0.2126],
        [ 0.9957,  0.3370,  0.9946, -0.5580, -0.8676, -0.9556],
        [ 0.9290,  0.5488,  0.8527,  0.1622, -0.9570, -0.3077],
        [ 0.9721,  0.1066, -0.9153, -0.1771, -0.9401, -0.9604]],
       device='cuda:0')
squash tensor([[ 0.5005, -1.9131, -1.9616,  3.4978, -1.1568, -1.8522],
        [-3.0125, -1.8888, -1.7577,  2.1999,  2.3608,  1.1732],
        [-2.3522, -2.7116, -1.7187, -1.3310,  2.0879,  0.8255],
        [ 0.1054,  1.1743, -2.2681, -1.0396, -0.4952, -0.3253],
        [ 1.6972,  0.9122,  1.8962,  1.0423, -1.1354,  0.7464],
        [ 1.7248, -0.1874,  2.0962,  1.3714, -1.4594, -0.7124],
        [ 2.5717, -1.2725, -1.3278,  2.2782, -2.1150, -2.1279],
        [-1.9512, -1.7906, -1.6827,  0.5298,  1.5199, -1.1886],
        [-1.3728, -1.6321, -1.7346, -1.1150,  1.2329,  1.3260],
        [ 0.3732,  1.0654, -2.1887, -0.9140,  0.2974,  0.5210],
        [ 3.2164, -0.1990,  1.7438,  0.3903, -1.1509, -1.0120],
        [ 2.1080,  0.2043,  2.3073,  0.2677, -1.4137, -0.6875],
        [ 2.6074,  0.5620, -0.2302,  1.1903, -1.8841, -0.9747],
        [-3.0967, -2.3689, -1.5752,  0.5660,  1.6457,  0.4485],
        [-1.4813, -1.0862, -2.4253, -0.5379,  2.1432,  0.8273],
        [ 2.1668,  0.6853, -0.7943, -0.1335,  1.4605, -0.6943],
        [ 3.2573, -0.5184,  4.1731,  0.2391, -1.5939, -0.2159],
        [ 3.0644,  0.3507,  2.9556, -0.6299, -1.3233, -1.8922],
        [ 1.6513,  0.6167,  1.2659,  0.1637, -1.9090, -0.3180],
        [ 2.1286,  0.1070, -1.5594, -0.1790, -1.7390, -1.9513]],
       device='cuda:0')
action: tensor([[ 0.9855, -0.0291, -0.9017,  0.2213, -0.9447, -0.9785],
        [-0.9301, -0.9907, -0.9641,  0.3537,  0.9343, -0.9303],
        [-0.7894, -0.9595, -0.9127, -0.7887,  0.9379,  0.6594],
        [ 0.5724,  0.7177, -0.9060, -0.8823, -0.3501, -0.3041],
        [ 0.9517,  0.2435,  0.9908,  0.2422, -0.9347, -0.7060],
        [ 0.9910,  0.4841,  0.9774,  0.0999, -0.6886, -0.6530],
        [ 0.9498, -0.3579, -0.9575,  0.8909, -0.9747, -0.8901],
        [-0.9868, -0.9335, -0.7128,  0.6498,  0.9795,  0.6016],
        [-0.9449, -0.9958, -0.9719, -0.6727,  0.9533,  0.6121],
        [ 0.5443,  0.6715, -0.4665, -0.2916,  0.3107, -0.1408],
        [ 0.9819, -0.2598,  0.9957,  0.0721, -0.5893, -0.4217],
        [ 0.9693,  0.1699,  0.9292, -0.0286, -0.8145,  0.2886],
        [ 0.9776,  0.2944,  0.0639,  0.3388, -0.9095, -0.9446],
        [ 0.8611, -0.5100, -0.5229,  0.5034, -0.7891, -0.9254],
        [-0.9687, -0.9918, -0.9633,  0.2223,  0.9870,  0.4204],
        [-0.9063, -0.9901, -0.9680, -0.7309,  0.9536,  0.7816],
        [ 0.9338,  0.7222, -0.2987,  0.0338,  0.5433,  0.4663],
        [ 0.9722, -0.4197,  0.9847,  0.7162, -0.9714, -0.6921],
        [ 0.9658, -0.0562,  0.1846,  0.8223, -0.9937, -0.5039],
        [ 0.7707, -0.7277, -0.9263,  0.9866, -0.9406,  0.9096]],
       device='cuda:0')
squash tensor([[ 2.4613, -0.0291, -1.4812,  0.2250, -1.7797, -2.2607],
        [-1.6590, -2.6846, -2.0004,  0.3696,  1.6912, -1.6603],
        [-1.0699, -1.9400, -1.5435, -1.0680,  1.7202,  0.7918],
        [ 0.6511,  0.9029, -1.5045, -1.3859, -0.3655, -0.3141],
        [ 1.8491,  0.2485,  2.6876,  0.2472, -1.6947, -0.8792],
        [ 2.6983,  0.5284,  2.2360,  0.1003, -0.8453, -0.7805],
        [ 1.8301, -0.3745, -1.9152,  1.4261, -2.1781, -1.4225],
        [-2.5086, -1.6850, -0.8928,  0.7749,  2.2862,  0.6956],
        [-1.7821, -3.0791, -2.1260, -0.8157,  1.8663,  0.7122],
        [ 0.6103,  0.8134, -0.5056, -0.3003,  0.3213, -0.1418],
        [ 2.3483, -0.2659,  3.0705,  0.0722, -0.6766, -0.4497],
        [ 2.0811,  0.1715,  1.6528, -0.0286, -1.1401,  0.2970],
        [ 2.2392,  0.3033,  0.0640,  0.3527, -1.5248, -1.7789],
        [ 1.2977, -0.5628, -0.5803,  0.5538, -1.0689, -1.6251],
        [-2.0705, -2.7438, -1.9894,  0.2261,  2.5133,  0.4482],
        [-1.5062, -2.6532, -2.0601, -0.9307,  1.8706,  1.0495],
        [ 1.6875,  0.9123, -0.3081,  0.0338,  0.6088,  0.5054],
        [ 2.1311, -0.4473,  2.4337,  0.8999, -2.1162, -0.8520],
        [ 2.0255, -0.0563,  0.1867,  1.1640, -2.8793, -0.5545],
        [ 1.0220, -0.9238, -1.6316,  2.4986, -1.7430,  1.5251]],
       device='cuda:0')
action: tensor([[ 9.9508e-01,  8.0743e-01,  9.3149e-01,  5.1187e-01, -7.2670e-01,
         -9.8953e-01],
        [ 4.9572e-01,  8.2886e-02, -8.1280e-01,  3.9642e-01, -9.7772e-01,
         -6.9886e-01],
        [-9.5028e-01, -9.9116e-01, -9.4918e-01,  1.0169e-01,  9.9283e-01,
          2.7623e-01],
        [-9.0171e-01, -8.9046e-01, -9.2828e-01, -6.0488e-01,  9.3963e-01,
          4.1200e-01],
        [ 9.7980e-01,  7.2652e-01, -1.6234e-02,  5.0219e-02,  8.9570e-01,
          1.0161e-01],
        [ 9.6299e-01, -2.0265e-02,  9.8700e-01,  7.0954e-02, -7.5810e-01,
         -9.1262e-01],
        [ 9.4533e-01,  3.3741e-01,  9.7710e-01,  2.9575e-01, -9.8511e-01,
         -7.7316e-01],
        [ 9.7032e-01, -2.0061e-01, -8.0634e-01,  8.7686e-01, -7.1851e-01,
         -9.5970e-02],
        [-9.4055e-01, -9.2124e-01, -9.4861e-01,  5.3135e-01,  9.6557e-01,
          6.7869e-01],
        [-8.4971e-01, -9.7689e-01, -8.5230e-01, -6.9304e-01,  9.6487e-01,
          6.7147e-01],
        [ 9.0944e-01,  8.6544e-01, -9.6006e-01, -7.2617e-01,  6.9225e-01,
          4.9662e-01],
        [ 9.8816e-01, -3.2410e-01,  9.5361e-01,  9.6049e-03,  2.4558e-01,
          1.4558e-01],
        [ 9.5408e-01,  3.1226e-01,  9.5342e-01, -4.3596e-01, -5.6408e-01,
         -6.4594e-01],
        [ 9.7078e-01,  7.8186e-01,  9.2055e-01, -1.5836e-01, -5.1102e-01,
         -9.0095e-01],
        [ 9.8338e-01,  1.8446e-01, -8.3980e-01,  9.3752e-02, -8.4869e-01,
         -8.4786e-01],
        [-9.9555e-01, -8.7431e-01, -9.8045e-01,  7.4692e-05,  9.3533e-01,
         -6.2707e-01],
        [-9.8146e-01, -9.7644e-01, -9.5245e-01, -3.8744e-01,  9.8435e-01,
          9.5845e-01],
        [ 7.6350e-01, -2.4691e-01, -7.5649e-01, -2.9632e-01,  9.1974e-01,
         -3.2300e-01],
        [ 9.8835e-01,  1.5303e-01,  9.7141e-01, -3.0023e-01, -6.4594e-01,
         -5.3762e-01],
        [ 9.4283e-01, -1.8813e-01,  8.8607e-01,  5.4500e-01, -6.2530e-02,
         -1.6381e-01]], device='cuda:0')
squash tensor([[ 3.0027e+00,  1.1196e+00,  1.6695e+00,  5.6526e-01, -9.2169e-01,
         -2.6233e+00],
        [ 5.4362e-01,  8.3077e-02, -1.1352e+00,  4.1939e-01, -2.2431e+00,
         -8.6507e-01],
        [-1.8346e+00, -2.7084e+00, -1.8235e+00,  1.0204e-01,  2.8138e+00,
          2.8359e-01],
        [-1.4813e+00, -1.4241e+00, -1.6458e+00, -7.0081e-01,  1.7349e+00,
          4.3802e-01],
        [ 2.2925e+00,  9.2132e-01, -1.6235e-02,  5.0262e-02,  1.4500e+00,
          1.0196e-01],
        [ 1.9855e+00, -2.0268e-02,  2.5147e+00,  7.1073e-02, -9.9173e-01,
         -1.5430e+00],
        [ 1.7859e+00,  3.5116e-01,  2.2290e+00,  3.0486e-01, -2.4463e+00,
         -1.0281e+00],
        [ 2.0978e+00, -2.0336e-01, -1.1165e+00,  1.3620e+00, -9.0455e-01,
         -9.6266e-02],
        [-1.7428e+00, -1.5972e+00, -1.8178e+00,  5.9202e-01,  2.0223e+00,
          8.2669e-01],
        [-1.2551e+00, -2.2245e+00, -1.2645e+00, -8.5378e-01,  2.0121e+00,
          8.1342e-01],
        [ 1.5243e+00,  1.3146e+00, -1.9467e+00, -9.2057e-01,  8.5226e-01,
          5.4481e-01],
        [ 2.5617e+00, -3.3622e-01,  1.8702e+00,  9.6052e-03,  2.5070e-01,
          1.4663e-01],
        [ 1.8753e+00,  3.2304e-01,  1.8681e+00, -4.6723e-01, -6.3880e-01,
         -7.6830e-01],
        [ 2.1057e+00,  1.0501e+00,  1.5926e+00, -1.5971e-01, -5.6411e-01,
         -1.4773e+00],
        [ 2.3911e+00,  1.8659e-01, -1.2205e+00,  9.4028e-02, -1.2514e+00,
         -1.2485e+00],
        [-3.0531e+00, -1.3511e+00, -2.3091e+00,  7.4692e-05,  1.6993e+00,
         -7.3658e-01],
        [-2.3358e+00, -2.2148e+00, -1.8575e+00, -4.0879e-01,  2.4213e+00,
          1.9265e+00],
        [ 1.0046e+00, -2.5212e-01, -9.8796e-01, -3.0548e-01,  1.5873e+00,
         -3.3499e-01],
        [ 2.5698e+00,  1.5424e-01,  2.1168e+00, -3.0977e-01, -7.6830e-01,
         -6.0081e-01],
        [ 1.7630e+00, -1.9040e-01,  1.4033e+00,  6.1125e-01, -6.2611e-02,
         -1.6530e-01]], device='cuda:0')
action: tensor([[-0.9943, -0.9766, -0.7840,  0.1256,  0.9606, -0.0551],
        [-0.9846, -0.9941, -0.8309, -0.4520,  0.9796,  0.9688],
        [ 0.9521,  0.7377,  0.0464,  0.0043,  0.9327,  0.8761],
        [ 0.9974, -0.0668,  0.9962,  0.5025, -0.9964, -0.8276],
        [ 0.9973,  0.3408,  0.6863,  0.7373, -0.9830, -0.6329],
        [ 0.8066, -0.6288, -0.8832,  0.9866, -0.7558, -0.6252],
        [-0.9646, -0.9921, -0.9880,  0.9913,  0.9959,  0.9570],
        [-0.9761, -0.9543, -0.9774, -0.3501,  0.9824,  0.3011],
        [ 0.7517,  0.7914, -0.8901, -0.6367,  0.7083,  0.5651],
        [ 0.9383, -0.2116,  0.9830,  0.7045, -0.4605,  0.1000],
        [ 0.9294, -0.0929,  0.8324,  0.4867, -0.3940, -0.2574],
        [ 0.9978, -0.7401,  0.7501,  0.8112, -0.8320, -0.7317],
        [ 0.3481, -0.9020, -0.6054,  0.2394, -0.5562, -0.9704],
        [-0.9988, -0.9915, -0.9885,  0.4397,  0.9885, -0.8772],
        [-0.6790, -0.9967, -0.8908, -0.9475,  0.8489,  0.5705],
        [ 0.9776,  0.9602,  0.0772, -0.2415, -0.5200, -0.3968],
        [ 0.9499, -0.2661,  0.9170,  0.3089, -0.9604, -0.9131],
        [ 0.9694,  0.4102,  0.6477,  0.1470, -0.9632, -0.5692],
        [ 0.9703,  0.4355, -0.7543,  0.9088, -0.9845, -0.4423],
        [-0.9953, -0.9948, -0.9828,  0.9054,  0.9870,  0.9524]],
       device='cuda:0')
squash tensor([[-2.9290, -2.2187, -1.0558,  0.1263,  1.9534, -0.0551],
        [-2.4308, -2.9112, -1.1909, -0.4872,  2.2867,  2.0725],
        [ 1.8537,  0.9454,  0.0464,  0.0043,  1.6786,  1.3588],
        [ 3.3279, -0.0669,  3.1276,  0.5527, -3.1617, -1.1806],
        [ 3.3058,  0.3550,  0.8408,  0.9445, -2.3808, -0.7462],
        [ 1.1173, -0.7395, -1.3902,  2.4992, -0.9864, -0.7335],
        [-2.0087, -2.7652, -2.5567,  2.7190,  3.0950,  1.9089],
        [-2.2076, -1.8775, -2.2368, -0.3656,  2.3610,  0.3108],
        [ 0.9769,  1.0752, -1.4225, -0.7526,  0.8837,  0.6403],
        [ 1.7237, -0.2148,  2.3788,  0.8762, -0.4979,  0.1003],
        [ 1.6539, -0.0932,  1.1958,  0.5318, -0.4166, -0.2633],
        [ 3.4015, -0.9506,  0.9731,  1.1306, -1.1945, -0.9324],
        [ 0.3633, -1.4829, -0.7016,  0.2441, -0.6273, -2.0984],
        [-3.7136, -2.7306, -2.5779,  0.4719,  2.5762, -1.3636],
        [-0.8273, -3.2047, -1.4260, -1.8064,  1.2523,  0.6483],
        [ 2.2407,  1.9491,  0.0774, -0.2464, -0.5764, -0.4198],
        [ 1.8303, -0.2726,  1.5695,  0.3194, -1.9511, -1.5456],
        [ 2.0830,  0.4358,  0.7714,  0.1481, -1.9879, -0.6463],
        [ 2.0979,  0.4667, -0.9828,  1.5203, -2.4271, -0.4751],
        [-3.0270, -2.9701, -2.3735,  1.5015,  2.5150,  1.8573]],
       device='cuda:0')
action: tensor([[ 0.8772, -0.1950,  0.4061,  0.9459,  0.9153,  0.6813],
        [ 0.9816,  0.2777,  0.9861,  0.7260, -0.9034, -0.4125],
        [ 0.9689,  0.5470,  0.9167,  0.8195, -0.9836, -0.6486],
        [ 0.9629,  0.0370, -0.9561,  0.9520, -0.9383,  0.6981],
        [-0.9838, -0.9367, -0.9741,  0.9826,  0.9951,  0.9561],
        [-0.8798, -0.9748, -0.9582,  0.0479,  0.5084,  0.9043],
        [ 0.7561, -0.2850, -0.6970,  0.1795,  0.5417,  0.4704],
        [ 0.9324,  0.2735,  0.9311,  0.7132, -0.8731,  0.5958],
        [-0.8739, -0.8684, -0.1475,  0.5660, -0.6191,  0.3432],
        [-0.9616,  0.5136, -0.9262, -0.7413, -0.8972,  0.4644],
        [ 0.9471,  0.9843, -0.7696, -0.7895, -0.9059, -0.9217],
        [ 0.9988, -0.4714,  0.8139, -0.9847, -0.8867, -0.9114],
        [ 0.8562,  0.6962, -0.4529,  0.1310, -0.9916, -0.9489],
        [-0.9949, -0.6860, -0.9536,  0.6384,  0.9787,  0.7317],
        [-0.8729, -0.8534, -0.9235, -0.7916,  0.9393,  0.9025],
        [ 0.8454,  0.7677, -0.7440,  0.1373,  0.8267,  0.2837],
        [ 0.9982,  0.1569,  0.9945,  0.2889, -0.9528, -0.3784],
        [ 0.9637,  0.0014,  0.8529,  0.3724, -0.9751,  0.4659],
        [ 0.9512,  0.0646, -0.6275,  0.8540, -0.9475, -0.5131],
        [-0.9983, -0.8579, -0.9801,  0.8916,  0.9823,  0.9653]],
       device='cuda:0')
squash tensor([[ 1.3635e+00, -1.9749e-01,  4.3098e-01,  1.7913e+00,  1.5594e+00,
          8.3151e-01],
        [ 2.3407e+00,  2.8520e-01,  2.4818e+00,  9.2021e-01, -1.4902e+00,
         -4.3866e-01],
        [ 2.0743e+00,  6.1411e-01,  1.5678e+00,  1.1553e+00, -2.3981e+00,
         -7.7282e-01],
        [ 1.9844e+00,  3.7064e-02, -1.8987e+00,  1.8530e+00, -1.7233e+00,
          8.6365e-01],
        [-2.4054e+00, -1.7108e+00, -2.1666e+00,  2.3666e+00,  3.0069e+00,
          1.8983e+00],
        [-1.3750e+00, -2.1807e+00, -1.9237e+00,  4.7903e-02,  5.6058e-01,
          1.4953e+00],
        [ 9.8707e-01, -2.9310e-01, -8.6141e-01,  1.8150e-01,  6.0659e-01,
          5.1057e-01],
        [ 1.6767e+00,  2.8060e-01,  1.6663e+00,  8.9360e-01, -1.3458e+00,
          6.8666e-01],
        [-1.3493e+00, -1.3265e+00, -1.4855e-01,  6.4164e-01, -7.2362e-01,
          3.5777e-01],
        [-1.9671e+00,  5.6767e-01, -1.6306e+00, -9.5335e-01, -1.4579e+00,
          5.0293e-01],
        [ 1.8032e+00,  2.4191e+00, -1.0192e+00, -1.0701e+00, -1.5044e+00,
         -1.6000e+00],
        [ 3.7257e+00, -5.1190e-01,  1.1385e+00, -2.4328e+00, -1.4064e+00,
         -1.5357e+00],
        [ 1.2788e+00,  8.5980e-01, -4.8828e-01,  1.3176e-01, -2.7364e+00,
         -1.8209e+00],
        [-2.9874e+00, -8.4039e-01, -1.8697e+00,  7.5549e-01,  2.2646e+00,
          9.3228e-01],
        [-1.3450e+00, -1.2684e+00, -1.6124e+00, -1.0757e+00,  1.7319e+00,
          1.4857e+00],
        [ 1.2399e+00,  1.0147e+00, -9.5947e-01,  1.3817e-01,  1.1775e+00,
          2.9171e-01],
        [ 3.4965e+00,  1.5824e-01,  2.9453e+00,  2.9734e-01, -1.8612e+00,
         -3.9822e-01],
        [ 1.9956e+00,  1.3734e-03,  1.2668e+00,  3.9120e-01, -2.1867e+00,
          5.0488e-01],
        [ 1.8444e+00,  6.4713e-02, -7.3735e-01,  1.2707e+00, -1.8063e+00,
         -5.6696e-01],
        [-3.5277e+00, -1.2854e+00, -2.2995e+00,  1.4296e+00,  2.3598e+00,
          2.0182e+00]], device='cuda:0')
action: tensor([[-0.9941, -0.9979, -0.9835, -0.7762,  0.8274,  0.9243],
        [ 0.7189, -0.1926, -0.2776,  0.3848,  0.9588,  0.0011],
        [ 0.9334, -0.0447,  0.9606, -0.0069, -0.8968, -0.7982],
        [ 0.9910, -0.5816,  0.9985, -0.0807, -0.8759, -0.4157],
        [ 0.9860,  0.7511,  0.9155,  0.2465, -0.9165, -0.2443],
        [ 0.9833,  0.2751, -0.6663,  0.2845, -0.9734, -0.8561],
        [-0.9797, -0.9264, -0.8382,  0.4894,  0.9653,  0.6596],
        [-0.9657, -0.9621, -0.9781, -0.7603,  0.9535,  0.8290],
        [ 0.6715,  0.5454, -0.8655, -0.7062,  0.4421,  0.0442],
        [ 0.9781,  0.0028,  0.9715,  0.8486, -0.9443, -0.5690],
        [ 0.9921,  0.5267,  0.9546,  0.4580, -0.9899, -0.7290],
        [ 0.9909,  0.2319, -0.9634,  0.9393, -0.4178, -0.5225],
        [-0.9929, -0.9691, -0.9838,  0.6370,  0.9514,  0.7021],
        [-0.8866, -0.9714, -0.9652, -0.3752,  0.5439,  0.3509],
        [ 0.8902,  0.8337, -0.6114, -0.2226,  0.7590,  0.2184],
        [ 0.9834, -0.7534,  0.9833,  0.4276, -0.8156, -0.0349],
        [ 0.9545, -0.2685,  0.9851,  0.1253, -0.8874, -0.5406],
        [ 0.9871,  0.2171,  0.9133,  0.5113, -0.9770, -0.6850],
        [-0.5670, -0.7549, -0.9040,  0.5160, -0.2626,  0.0600],
        [-0.9719, -0.9924, -0.7727,  0.1443,  0.9309,  0.7833]],
       device='cuda:0')
squash tensor([[-2.9091e+00, -3.4324e+00, -2.3958e+00, -1.0356e+00,  1.1799e+00,
          1.6179e+00],
        [ 9.0534e-01, -1.9499e-01, -2.8511e-01,  4.0570e-01,  1.9305e+00,
          1.1419e-03],
        [ 1.6842e+00, -4.4731e-02,  1.9535e+00, -6.8519e-03, -1.4558e+00,
         -1.0938e+00],
        [ 2.7008e+00, -6.6480e-01,  3.6030e+00, -8.0881e-02, -1.3578e+00,
         -4.4251e-01],
        [ 2.4757e+00,  9.7548e-01,  1.5603e+00,  2.5171e-01, -1.5664e+00,
         -2.4935e-01],
        [ 2.3877e+00,  2.8242e-01, -8.0414e-01,  2.9258e-01, -2.1528e+00,
         -1.2784e+00],
        [-2.2898e+00, -1.6326e+00, -1.2151e+00,  5.3523e-01,  2.0181e+00,
          7.9214e-01],
        [-2.0249e+00, -1.9739e+00, -2.2517e+00, -9.9685e-01,  1.8694e+00,
          1.1850e+00],
        [ 8.1341e-01,  6.1184e-01, -1.3151e+00, -8.7957e-01,  4.7485e-01,
          4.4275e-02],
        [ 2.2514e+00,  2.7591e-03,  2.1185e+00,  1.2513e+00, -1.7765e+00,
         -6.4598e-01],
        [ 2.7648e+00,  5.8561e-01,  1.8811e+00,  4.9480e-01, -2.6411e+00,
         -9.2649e-01],
        [ 2.6925e+00,  2.3620e-01, -1.9917e+00,  1.7324e+00, -4.4498e-01,
         -5.7978e-01],
        [-2.8192e+00, -2.0776e+00, -2.4034e+00,  7.5318e-01,  1.8465e+00,
          8.7151e-01],
        [-1.4056e+00, -2.1171e+00, -2.0162e+00, -3.9448e-01,  6.0965e-01,
          3.6651e-01],
        [ 1.4227e+00,  1.2002e+00, -7.1113e-01, -2.2643e-01,  9.9391e-01,
          2.2199e-01],
        [ 2.3917e+00, -9.8068e-01,  2.3891e+00,  4.5693e-01, -1.1436e+00,
         -3.4897e-02],
        [ 1.8805e+00, -2.7521e-01,  2.4458e+00,  1.2592e-01, -1.4095e+00,
         -6.0501e-01],
        [ 2.5178e+00,  2.2061e-01,  1.5472e+00,  5.6450e-01, -2.2259e+00,
         -8.3842e-01],
        [-6.4307e-01, -9.8430e-01, -1.4935e+00,  5.7086e-01, -2.6885e-01,
          6.0034e-02],
        [-2.1257e+00, -2.7829e+00, -1.0271e+00,  1.4531e-01,  1.6651e+00,
          1.0538e+00]], device='cuda:0')
action: tensor([[ 0.9554, -0.5476,  0.8194,  0.8588, -0.9070, -0.9136],
        [ 0.6308, -0.4800, -0.2743,  0.2829, -0.9306, -0.9924],
        [-0.8865, -0.9888, -0.5882,  0.4077,  0.9579, -0.8694],
        [-0.9463, -0.8992, -0.7099, -0.7909,  0.9617,  0.2350],
        [ 0.8314,  0.9187, -0.8188, -0.4943,  0.3604,  0.1591],
        [ 0.9928,  0.1793,  0.9871, -0.0025, -0.9477, -0.8691],
        [ 0.9855,  0.4632,  0.9608, -0.1223, -0.8368, -0.3280],
        [ 0.9967, -0.1328, -0.9593,  0.9570, -0.9674, -0.4127],
        [-0.9897, -0.9715, -0.9512,  0.4033,  0.9566,  0.2063],
        [-0.9538, -0.9502, -0.9474, -0.1776,  0.9483,  0.6508],
        [ 0.9634,  0.3227, -0.6187, -0.1422,  0.8564,  0.2175],
        [ 0.9730, -0.3555,  0.8737,  0.7733, -0.9711, -0.8400],
        [ 0.9644,  0.0653,  0.8548,  0.6850, -0.9561, -0.8407],
        [ 0.9801, -0.1757, -0.8629,  0.9741, -0.9357,  0.1026],
        [-0.9513, -0.9945, -0.8766,  0.9582,  0.9891,  0.9366],
        [-0.9917, -0.9573, -0.9965, -0.2867,  0.9770,  0.9139],
        [ 0.9871,  0.8473, -0.9862, -0.2632,  0.4615,  0.8724],
        [ 0.8274, -0.3634,  0.9582,  0.3171, -0.8459, -0.2892],
        [ 0.9611,  0.1709,  0.9813, -0.5228, -0.8064, -0.6535],
        [ 0.9788,  0.4381,  0.9030,  0.6163, -0.9485,  0.1800]],
       device='cuda:0')
squash tensor([[ 1.8904e+00, -6.1489e-01,  1.1550e+00,  1.2889e+00, -1.5101e+00,
         -1.5488e+00],
        [ 7.4276e-01, -5.2302e-01, -2.8148e-01,  2.9082e-01, -1.6626e+00,
         -2.7852e+00],
        [-1.4055e+00, -2.5907e+00, -6.7488e-01,  4.3280e-01,  1.9201e+00,
         -1.3306e+00],
        [-1.7951e+00, -1.4682e+00, -8.8705e-01, -1.0737e+00,  1.9682e+00,
          2.3947e-01],
        [ 1.1927e+00,  1.5807e+00, -1.1530e+00, -5.4174e-01,  3.7737e-01,
          1.6045e-01],
        [ 2.8113e+00,  1.8129e-01,  2.5198e+00, -2.4995e-03, -1.8087e+00,
         -1.3295e+00],
        [ 2.4597e+00,  5.0133e-01,  1.9557e+00, -1.2294e-01, -1.2105e+00,
         -3.4058e-01],
        [ 3.2017e+00, -1.3357e-01, -1.9369e+00,  1.9091e+00, -2.0506e+00,
         -4.3884e-01],
        [-2.6309e+00, -2.1183e+00, -1.8445e+00,  4.2763e-01,  1.9044e+00,
          2.0930e-01],
        [-1.8722e+00, -1.8337e+00, -1.8055e+00, -1.7955e-01,  1.8143e+00,
          7.7662e-01],
        [ 1.9906e+00,  3.3464e-01, -7.2283e-01, -1.4319e-01,  1.2795e+00,
          2.2100e-01],
        [ 2.1462e+00, -3.7170e-01,  1.3485e+00,  1.0286e+00, -2.1105e+00,
         -1.2211e+00],
        [ 2.0058e+00,  6.5367e-02,  1.2738e+00,  8.3850e-01, -1.8980e+00,
         -1.2234e+00],
        [ 2.3009e+00, -1.7758e-01, -1.3047e+00,  2.1669e+00, -1.7027e+00,
          1.0292e-01],
        [-1.8451e+00, -2.9423e+00, -1.3610e+00,  1.9236e+00,  2.6047e+00,
          1.7099e+00],
        [-2.7421e+00, -1.9130e+00, -3.1758e+00, -2.9499e-01,  2.2274e+00,
          1.5504e+00],
        [ 2.5172e+00,  1.2463e+00, -2.4860e+00, -2.6949e-01,  4.9917e-01,
          1.3429e+00],
        [ 1.1798e+00, -3.8084e-01,  1.9236e+00,  3.2839e-01, -1.2416e+00,
         -2.9774e-01],
        [ 1.9605e+00,  1.7261e-01,  2.3322e+00, -5.8015e-01, -1.1166e+00,
         -7.8130e-01],
        [ 2.2691e+00,  4.6993e-01,  1.4884e+00,  7.1894e-01, -1.8171e+00,
          1.8199e-01]], device='cuda:0')
action: tensor([[-0.9911, -0.9718, -0.9860,  0.8096,  0.8670,  0.5209],
        [-0.9465, -0.9778, -0.9172, -0.9052,  0.9073,  0.9231],
        [ 0.9756,  0.2250, -0.5035,  0.9224,  0.7533, -0.2435],
        [ 0.9976,  0.1635,  0.9731,  0.5486, -0.9006, -0.8740],
        [ 0.9807,  0.2369,  0.8928,  0.9134, -0.9275, -0.3675],
        [ 0.8224,  0.0266, -0.9007,  0.9492, -0.9034, -0.4326],
        [-0.9769, -0.9190, -0.7771,  0.9878,  0.9700,  0.8281],
        [-0.8967, -0.9825, -0.9395,  0.2652,  0.9441,  0.7626],
        [ 0.7529,  0.9607, -0.9277, -0.9803, -0.1983, -0.0111],
        [ 0.9739,  0.9107,  0.9431, -0.0536, -0.8239,  0.4136],
        [-0.9496,  0.0163, -0.8529,  0.7621,  0.8642, -0.1954],
        [-0.2129,  0.8705, -0.5942, -0.5929, -0.8733,  0.7720],
        [-0.6138,  0.8700, -0.8899, -0.9034, -0.4686, -0.6735],
        [ 0.8041,  0.9289, -0.7624, -0.9748, -0.6393, -0.6708],
        [ 0.9669, -0.7950,  0.9402, -0.9470, -0.6858, -0.7919],
        [ 0.9736, -0.7809, -0.9959,  0.8487, -0.9867, -0.8934],
        [-0.9849, -0.5130, -0.9862,  0.6570,  0.9737,  0.9442],
        [-0.9892, -0.9913, -0.8711, -0.8870,  0.9472,  0.2948],
        [-0.2387,  0.9846, -0.9490,  0.4857, -0.1427, -0.7180],
        [ 0.9601,  0.9625,  0.6532,  0.0803, -0.9290, -0.6971]],
       device='cuda:0')
squash tensor([[-2.7062, -2.1231, -2.4785,  1.1257,  1.3207,  0.5776],
        [-1.7967, -2.2456, -1.5714, -1.5001,  1.5119,  1.6098],
        [ 2.1962,  0.2289, -0.5540,  1.6047,  0.9805, -0.2485],
        [ 3.3647,  0.1649,  2.1474,  0.6164, -1.4752, -1.3498],
        [ 2.3158,  0.2414,  1.4356,  1.5478, -1.6404, -0.3856],
        [ 1.1642,  0.0266, -1.4760,  1.8241, -1.4906, -0.4631],
        [-2.2253, -1.5822, -1.0381,  2.5453,  2.0931,  1.1821],
        [-1.4550, -2.3650, -1.7338,  0.2717,  1.7743,  1.0023],
        [ 0.9797,  1.9555, -1.6416, -2.3055, -0.2009, -0.0111],
        [ 2.1633,  1.5315,  1.7655, -0.0536, -1.1689,  0.4399],
        [-1.8279,  0.0163, -1.2667,  1.0013,  1.3098, -0.1980],
        [-0.2162,  1.3352, -0.6842, -0.6821, -1.3468,  1.0252],
        [-0.7150,  1.3329, -1.4216, -1.4903, -0.5082, -0.8171],
        [ 1.1100,  1.6502, -1.0019, -2.1816, -0.7570, -0.8122],
        [ 2.0429, -1.0849,  1.7401, -1.8022, -0.8400, -1.0764],
        [ 2.1571, -1.0477, -3.0972,  1.2514, -2.5033, -1.4385],
        [-2.4379, -0.5667, -2.4834,  0.7874,  2.1593,  1.7750],
        [-2.6063, -2.7150, -1.3378, -1.4076,  1.8041,  0.3038],
        [-0.2434,  2.4300, -1.8217,  0.5304, -0.1436, -0.9036],
        [ 1.9477,  1.9794,  0.7808,  0.0805, -1.6514, -0.8616]],
       device='cuda:0')
action: tensor([[-0.9263, -0.9481, -0.7906, -0.8302,  0.9645,  0.9403],
        [ 0.9083,  0.1930, -0.1788,  0.7554,  0.8195,  0.7126],
        [ 0.9907,  0.9532,  0.8964,  0.1116, -0.8566, -0.9206],
        [ 0.9793,  0.5143,  0.9723,  0.7790, -0.9091, -0.9738],
        [ 0.9955,  0.0328, -0.9830,  0.9321, -0.9268,  0.2201],
        [-0.9928, -0.9714, -0.9279,  0.9342,  0.9761,  0.9166],
        [-0.9782, -0.8222, -0.9862,  0.0593,  0.9719,  0.9151],
        [ 0.4025,  0.8517, -0.9606, -0.4423,  0.0454, -0.0259],
        [ 0.9553, -0.1357,  0.9838,  0.5772,  0.2445,  0.7100],
        [ 0.9126, -0.4614, -0.1482,  0.4709, -0.8553, -0.1569],
        [ 0.9742, -0.2695,  0.8857,  0.8302, -0.1081, -0.5635],
        [ 0.6920, -0.7104, -0.9019,  0.6098, -0.8811, -0.9615],
        [-0.9766, -0.9593, -0.9493,  0.3897,  0.9627, -0.8054],
        [-0.7863, -0.9945, -0.9227, -0.8279,  0.9717,  0.8804],
        [ 0.9281,  0.8042, -0.9878, -0.9347, -0.8436,  0.9247],
        [ 0.9793,  0.1981,  0.9850,  0.4432, -0.4931, -0.2564],
        [ 0.5081,  0.7654,  0.9845, -0.1261, -0.9677, -0.4041],
        [ 0.9881,  0.5751, -0.3399,  0.0419, -0.9460, -0.4350],
        [-0.9639, -0.8595, -0.9954,  0.4619,  0.9257,  0.0718],
        [-0.9300, -0.9864, -0.9221, -0.5100,  0.9282,  0.5911]],
       device='cuda:0')
squash tensor([[-1.6313, -1.8125, -1.0731, -1.1886,  2.0073,  1.7407],
        [ 1.5175,  0.1954, -0.1808,  0.9854,  1.1552,  0.8925],
        [ 2.6826,  1.8658,  1.4536,  0.1121, -1.2803, -1.5929],
        [ 2.2800,  0.5686,  2.1332,  1.0428, -1.5223, -2.1606],
        [ 3.0449,  0.0328, -2.3786,  1.6743, -1.6354,  0.2238],
        [-2.8147, -2.1166, -1.6430,  1.6901,  2.2076,  1.5670],
        [-2.2541, -1.1635, -2.4831,  0.0594,  2.1252,  1.5582],
        [ 0.4266,  1.2624, -1.9536, -0.4751,  0.0454, -0.0259],
        [ 1.8888, -0.1365,  2.4027,  0.6582,  0.2495,  0.8871],
        [ 1.5430, -0.4990, -0.1493,  0.5112, -1.2758, -0.1582],
        [ 2.1690, -0.2763,  1.4015,  1.1889, -0.1085, -0.6379],
        [ 0.8518, -0.8880, -1.4825,  0.7086, -1.3807, -1.9650],
        [-2.2186, -1.9369, -1.8248,  0.4115,  1.9820, -1.1137],
        [-1.0618, -2.9499, -1.6069, -1.1813,  2.1217,  1.3773],
        [ 1.6442,  1.1104, -2.5467, -1.6947, -1.2334,  1.6203],
        [ 2.2798,  0.2008,  2.4434,  0.4762, -0.5401, -0.2623],
        [ 0.5602,  1.0091,  2.4252, -0.1267, -2.0554, -0.4285],
        [ 2.5572,  0.6552, -0.3540,  0.0420, -1.7918, -0.4661],
        [-1.9988, -1.2914, -3.0343,  0.4998,  1.6276,  0.0720],
        [-1.6586, -2.4926, -1.6026, -0.5628,  1.6449,  0.6793]],
       device='cuda:0')
action: tensor([[-0.9512, -0.9952, -0.9754, -0.8486,  0.9804,  0.9819],
        [ 0.7798,  0.6760, -0.8252,  0.5788,  0.7174, -0.6389],
        [ 0.9994,  0.5057,  0.9850,  0.6464, -0.6747, -0.7299],
        [ 0.9432,  0.4255,  0.9258, -0.2825, -0.9787, -0.8521],
        [ 0.8723,  0.6657, -0.4963,  0.6561, -0.9389, -0.8582],
        [-0.9953, -0.9438, -0.9253,  0.7199,  0.9935,  0.9220],
        [-0.9939, -0.9960, -0.9815, -0.0027,  0.9886,  0.9463],
        [ 0.0814, -0.2053, -0.9258, -0.5503, -0.0634,  0.2908],
        [ 0.9724, -0.2730,  0.9718,  0.6761, -0.0874,  0.9442],
        [ 0.7991, -0.5896,  0.9408, -0.0615, -0.4751,  0.5095],
        [-0.2046,  0.5353,  0.7834,  0.2356,  0.4628, -0.5436],
        [-0.8204,  0.7104, -0.5801, -0.6222,  0.2315,  0.9451],
        [ 0.2819,  0.6750, -0.8440, -0.5821, -0.8692,  0.2601],
        [-0.7532,  0.4553, -0.6348, -0.9787, -0.4628, -0.6450],
        [ 0.9988, -0.3633,  0.9595, -0.9872, -0.9743, -0.8222],
        [ 0.9829, -0.9269,  0.6891,  0.3964, -0.9835, -0.9703],
        [-0.9972, -0.8149, -0.9744,  0.6209,  0.9982,  0.9383],
        [-0.9947, -0.8932, -0.9787, -0.3269,  0.9955,  0.9882],
        [-0.9576, -0.2302, -0.6752,  0.6211,  0.9503,  0.6768],
        [ 0.9523, -0.6752,  0.9569,  0.8795,  0.7837,  0.3671]],
       device='cuda:0')
squash tensor([[-1.8438e+00, -3.0161e+00, -2.1923e+00, -1.2511e+00,  2.3070e+00,
          2.3466e+00],
        [ 1.0448e+00,  8.2174e-01, -1.1729e+00,  6.6058e-01,  9.0229e-01,
         -7.5630e-01],
        [ 4.0710e+00,  5.5695e-01,  2.4432e+00,  7.6909e-01, -8.1924e-01,
         -9.2855e-01],
        [ 1.7660e+00,  4.5442e-01,  1.6282e+00, -2.9042e-01, -2.2649e+00,
         -1.2638e+00],
        [ 1.3424e+00,  8.0301e-01, -5.4438e-01,  7.8588e-01, -1.7289e+00,
         -1.2864e+00],
        [-3.0257e+00, -1.7718e+00, -1.6248e+00,  9.0741e-01,  2.8647e+00,
          1.6020e+00],
        [-2.8919e+00, -3.1083e+00, -2.3373e+00, -2.7490e-03,  2.5819e+00,
          1.7954e+00],
        [ 8.1578e-02, -2.0824e-01, -1.6281e+00, -6.1874e-01, -6.3531e-02,
          2.9942e-01],
        [ 2.1337e+00, -2.8010e-01,  2.1239e+00,  8.2191e-01, -8.7605e-02,
          1.7757e+00],
        [ 1.0961e+00, -6.7707e-01,  1.7451e+00, -6.1625e-02, -5.1668e-01,
          5.6200e-01],
        [-2.0755e-01,  5.9755e-01,  1.0541e+00,  2.4015e-01,  5.0085e-01,
         -6.0930e-01],
        [-1.1581e+00,  8.8807e-01, -6.6265e-01, -7.2851e-01,  2.3572e-01,
          1.7836e+00],
        [ 2.8980e-01,  8.1995e-01, -1.2350e+00, -6.6564e-01, -1.3298e+00,
          2.6623e-01],
        [-9.8027e-01,  4.9135e-01, -7.4933e-01, -2.2647e+00, -5.0087e-01,
         -7.6673e-01],
        [ 3.7040e+00, -3.8072e-01,  1.9396e+00, -2.5241e+00, -2.1701e+00,
         -1.1635e+00],
        [ 2.3759e+00, -1.6362e+00,  8.4633e-01,  4.1932e-01, -2.3935e+00,
         -2.0973e+00],
        [-3.2784e+00, -1.1415e+00, -2.1720e+00,  7.2642e-01,  3.5099e+00,
          1.7234e+00],
        [-2.9623e+00, -1.4375e+00, -2.2647e+00, -3.3932e-01,  3.0462e+00,
          2.5624e+00],
        [-1.9164e+00, -2.3436e-01, -8.2027e-01,  7.2671e-01,  1.8348e+00,
          8.2321e-01],
        [ 1.8562e+00, -8.2033e-01,  1.9074e+00,  1.3734e+00,  1.0548e+00,
          3.8509e-01]], device='cuda:0')
action: tensor([[-0.9733, -0.9348, -0.9144,  0.5518,  0.9843, -0.9231],
        [-0.8489, -0.9918, -0.8457, -0.8062,  0.9797,  0.6365],
        [ 0.7959,  0.8459, -0.9422, -0.8620, -0.2783, -0.3803],
        [ 0.9825,  0.0403,  0.9901,  0.1686, -0.9785, -0.4796],
        [ 0.9950,  0.3819,  0.9704,  0.6649, -0.8696, -0.6767],
        [ 0.8408, -0.8380, -0.9809,  0.9583, -0.6996, -0.5402],
        [-0.9690, -0.8351, -0.9957,  0.8578,  0.9807,  0.5246],
        [-0.9250, -0.9906, -0.9741, -0.9240,  0.9818,  0.7775],
        [ 0.2183,  0.9083, -0.9572, -0.6626, -0.4160,  0.0978],
        [ 0.9608,  0.7377,  0.9056,  0.8753, -0.4178,  0.4872],
        [ 0.8868,  0.4973,  0.9622,  0.3348, -0.7265, -0.4518],
        [ 0.9709,  0.4085,  0.5771,  0.2947, -0.8476, -0.9739],
        [ 0.9473, -0.8209, -0.7402,  0.1228, -0.9531, -0.9436],
        [-0.9660, -0.9746, -0.9785,  0.6720,  0.9549, -0.7935],
        [-0.9842, -0.9901, -0.9705, -0.7336,  0.8754,  0.8750],
        [ 0.9171,  0.8483, -0.8075, -0.7046,  0.1633,  0.7331],
        [ 0.9830,  0.0919,  0.9574,  0.1907, -0.8515,  0.5601],
        [ 0.9712,  0.0365,  0.9774,  0.4829, -0.9341, -0.1986],
        [ 0.7764, -0.7416, -0.7313,  0.9164, -0.9418, -0.8901],
        [-0.9828, -0.9833, -0.7123,  0.3995,  0.9312, -0.4620]],
       device='cuda:0')
squash tensor([[-2.1507, -1.6950, -1.5538,  0.6210,  2.4195, -1.6099],
        [-1.2520, -2.7450, -1.2408, -1.1161,  2.2897,  0.7522],
        [ 1.0874,  1.2416, -1.7570, -1.3010, -0.2858, -0.4004],
        [ 2.3639,  0.0403,  2.6499,  0.1703, -2.2601, -0.5225],
        [ 2.9935,  0.4022,  2.0989,  0.8015, -1.3316, -0.8230],
        [ 1.2238, -1.2143, -2.3217,  1.9243, -0.8665, -0.6045],
        [-2.0755, -1.2047, -3.0667,  1.2848,  2.3156,  0.5827],
        [-1.6228, -2.6790, -2.1666, -1.6156,  2.3458,  1.0391],
        [ 0.2218,  1.5175, -1.9114, -0.7975, -0.4429,  0.0981],
        [ 1.9560,  0.9455,  1.5028,  1.3554, -0.4451,  0.5324],
        [ 1.4066,  0.5458,  1.9741,  0.3482, -0.9213, -0.4869],
        [ 2.1075,  0.4338,  0.6581,  0.3037, -1.2477, -2.1624],
        [ 1.8047, -1.1594, -0.9510,  0.1234, -1.8643, -1.7704],
        [-2.0281, -2.1773, -2.2601,  0.8144,  1.8851, -1.0807],
        [-2.4164, -2.6510, -2.1002, -0.9364,  1.3558,  1.3542],
        [ 1.5704,  1.2502, -1.1199, -0.8763,  0.1648,  0.9353],
        [ 2.3808,  0.0921,  1.9143,  0.1931, -1.2617,  0.6330],
        [ 2.1131,  0.0365,  2.2359,  0.5267, -1.6896, -0.2013],
        [ 1.0362, -0.9540, -0.9316,  1.5661, -1.7538, -1.4225],
        [-2.3738, -2.3893, -0.8917,  0.4230,  1.6675, -0.4999]],
       device='cuda:0')
action: tensor([[-0.9906, -0.9385, -0.8831,  0.5348,  0.8757,  0.3969],
        [-0.4197, -0.9801, -0.9504, -0.4113,  0.9786,  0.7089],
        [ 0.9964, -0.0280, -0.3305,  0.0941,  0.8581,  0.7032],
        [ 0.9951,  0.3969,  0.9972, -0.1500, -0.9635, -0.8815],
        [ 0.9977, -0.0157,  0.9473, -0.3129, -0.9677,  0.6031],
        [ 0.9759,  0.2339, -0.0976,  0.9322, -0.7658, -0.9415],
        [ 0.8168,  0.0634, -0.9247,  0.1547, -0.8757, -0.6761],
        [-0.9912, -0.9778, -0.9866,  0.5562,  0.8577,  0.7585],
        [-0.9885, -0.9495, -0.8448, -0.8279,  0.9115,  0.9280],
        [ 0.8608,  0.4337, -0.7709,  0.0016,  0.7003, -0.1375],
        [ 0.9731,  0.0714,  0.9950,  0.3876, -0.9416, -0.9495],
        [ 0.9344, -0.1675,  0.9607,  0.7955, -0.6559, -0.4259],
        [ 0.9728, -0.6132, -0.8786,  0.9887, -0.9753, -0.2761],
        [-0.9812, -0.9872, -0.9448,  0.6641,  0.9737,  0.3241],
        [-0.9765, -0.9427, -0.9907, -0.2266,  0.9746,  0.8791],
        [ 0.6193,  0.8627, -0.9151, -0.6186, -0.5128,  0.0802],
        [ 0.9579, -0.1431,  0.9741,  0.5578, -0.8700,  0.2745],
        [ 0.9933,  0.2262,  0.9684, -0.0169, -0.9113, -0.5709],
        [ 0.9659, -0.2054,  0.4347,  0.8078, -0.8816, -0.8728],
        [-0.9836, -0.9138, -0.9390,  0.2560,  0.8821,  0.6824]],
       device='cuda:0')
squash tensor([[-2.6751e+00, -1.7256e+00, -1.3898e+00,  5.9689e-01,  1.3572e+00,
          4.1994e-01],
        [-4.4732e-01, -2.3012e+00, -1.8362e+00, -4.3718e-01,  2.2633e+00,
          8.8494e-01],
        [ 3.1633e+00, -2.8047e-02, -3.4339e-01,  9.4384e-02,  1.2861e+00,
          8.7351e-01],
        [ 3.0060e+00,  4.1991e-01,  3.2845e+00, -1.5111e-01, -1.9926e+00,
         -1.3825e+00],
        [ 3.3740e+00, -1.5660e-02,  1.8048e+00, -3.2376e-01, -2.0550e+00,
          6.9796e-01],
        [ 2.2025e+00,  2.3829e-01, -9.7867e-02,  1.6746e+00, -1.0102e+00,
         -1.7510e+00],
        [ 1.1470e+00,  6.3481e-02, -1.6203e+00,  1.5595e-01, -1.3571e+00,
         -8.2183e-01],
        [-2.7091e+00, -2.2453e+00, -2.5010e+00,  6.2733e-01,  1.2845e+00,
          9.9272e-01],
        [-2.5784e+00, -1.8265e+00, -1.2377e+00, -1.1815e+00,  1.5361e+00,
          1.6438e+00],
        [ 1.2963e+00,  4.6444e-01, -1.0226e+00,  1.5536e-03,  8.6790e-01,
         -1.3840e-01],
        [ 2.1483e+00,  7.1545e-02,  2.9931e+00,  4.0898e-01, -1.7519e+00,
         -1.8269e+00],
        [ 1.6918e+00, -1.6913e-01,  1.9548e+00,  1.0862e+00, -7.8559e-01,
         -4.5486e-01],
        [ 2.1414e+00, -7.1409e-01, -1.3698e+00,  2.5872e+00, -2.1918e+00,
         -2.8345e-01],
        [-2.3299e+00, -2.5209e+00, -1.7809e+00,  8.0003e-01,  2.1584e+00,
          3.3624e-01],
        [-2.2155e+00, -1.7619e+00, -2.6845e+00, -2.3057e-01,  2.1767e+00,
          1.3716e+00],
        [ 7.2389e-01,  1.3038e+00, -1.5578e+00, -7.2270e-01, -5.6659e-01,
          8.0327e-02],
        [ 1.9198e+00, -1.4408e-01,  2.1677e+00,  6.2962e-01, -1.3332e+00,
          2.8176e-01],
        [ 2.8487e+00,  2.3019e-01,  2.0660e+00, -1.6917e-02, -1.5350e+00,
         -6.4887e-01],
        [ 2.0274e+00, -2.0835e-01,  4.6569e-01,  1.1207e+00, -1.3829e+00,
         -1.3447e+00],
        [-2.3990e+00, -1.5499e+00, -1.7298e+00,  2.6186e-01,  1.3851e+00,
          8.3354e-01]], device='cuda:0')
action: tensor([[ 0.9679,  0.0568,  0.9976, -0.1239, -0.9117,  0.0440],
        [ 0.9458, -0.5676, -0.3514,  0.8538, -0.9069, -0.7684],
        [-0.7718, -0.9761, -0.9546,  0.7308,  0.9623,  0.7945],
        [-0.9756, -0.9585, -0.9917, -0.8758,  0.9256,  0.7124],
        [ 0.9759,  0.5326, -0.2004,  0.1241,  0.7594,  0.7272],
        [ 0.9890, -0.2162,  0.9844, -0.3229, -0.9247, -0.6480],
        [ 0.9810, -0.6605,  0.9521,  0.6797, -0.8496,  0.2582],
        [ 0.9756, -0.5915, -0.8759,  0.9729, -0.8454, -0.7535],
        [-0.9836, -0.7382, -0.4073,  0.5822,  0.9758, -0.5864],
        [-0.9934, -0.9883, -0.7722, -0.6799,  0.9576,  0.4870],
        [ 0.5381,  0.8031, -0.9119, -0.9165, -0.7677,  0.2433],
        [ 0.9966, -0.1865,  0.8879,  0.4131,  0.4658,  0.7698],
        [ 0.6801, -0.0753,  0.9771, -0.3815, -0.8747, -0.9674],
        [ 0.9862,  0.7455,  0.9772,  0.3949, -0.7527, -0.9393],
        [ 0.8463,  0.1192, -0.4786, -0.0176, -0.9620, -0.9332],
        [-0.9945, -0.9841, -0.9356,  0.6313,  0.9535, -0.1803],
        [-0.9482, -0.9857, -0.9915, -0.9093,  0.9428,  0.4588],
        [ 0.6624,  0.6968, -0.4206, -0.5260,  0.8613,  0.5840],
        [ 0.9973, -0.0838,  0.9866,  0.3678, -0.9448, -0.6725],
        [ 0.9765,  0.6754,  0.8662,  0.0820, -0.9442, -0.9534]],
       device='cuda:0')
squash tensor([[ 2.0577,  0.0569,  3.3689, -0.1245, -1.5377,  0.0440],
        [ 1.7903, -0.6440, -0.3671,  1.2701, -1.5097, -1.0165],
        [-1.0246, -2.2065, -1.8814,  0.9305,  1.9765,  1.0834],
        [-2.1975, -1.9265, -2.7402, -1.3574,  1.6265,  0.8920],
        [ 2.2025,  0.5937, -0.2031,  0.1247,  0.9948,  0.9227],
        [ 2.6006, -0.2196,  2.4226, -0.3349, -1.6207, -0.7718],
        [ 2.3248, -0.7937,  1.8536,  0.8286, -1.2547,  0.2642],
        [ 2.1965, -0.6799, -1.3579,  2.1447, -1.2397, -0.9811],
        [-2.3968, -0.9464, -0.4323,  0.6657,  2.2020, -0.6722],
        [-2.8590, -2.5679, -1.0258, -0.8290,  1.9160,  0.5321],
        [ 0.6015,  1.1073, -1.5389, -1.5669, -1.0147,  0.2483],
        [ 3.1841, -0.1887,  1.4120,  0.4394,  0.5048,  1.0198],
        [ 0.8292, -0.0755,  2.2296, -0.4018, -1.3529, -2.0507],
        [ 2.4830,  0.9628,  2.2306,  0.4176, -0.9792, -1.7321],
        [ 1.2430,  0.1197, -0.5212, -0.0177, -1.9718, -1.6824],
        [-2.9437, -2.4146, -1.7013,  0.7435,  1.8687, -0.1823],
        [-1.8140, -2.4668, -2.7298, -1.5237,  1.7631,  0.4958],
        [ 0.7970,  0.8610, -0.4484, -0.5845,  1.2984,  0.6686],
        [ 3.3113, -0.0840,  2.4991,  0.3859, -1.7807, -0.8153],
        [ 2.2161,  0.8206,  1.3176,  0.0822, -1.7758, -1.8679]],
       device='cuda:0')
action: tensor([[-0.9927, -0.9705, -0.8354,  0.9840,  0.9784,  0.9036],
        [-0.9504, -0.9811, -0.8938, -0.0596,  0.9634,  0.4858],
        [-0.5675,  0.8739, -0.6678, -0.9753, -0.3833,  0.7595],
        [ 0.9835,  0.6768,  0.9774,  0.8412, -0.6906,  0.3245],
        [-0.9977,  0.9761, -0.9324, -0.8389, -0.2273,  0.6333],
        [ 0.9210,  0.9480, -0.9964, -0.8901,  0.1943,  0.7286],
        [ 0.9923, -0.6251,  0.9880, -0.8250, -0.9856, -0.9662],
        [ 0.9962,  0.9305, -0.8745,  0.1185, -0.9349, -0.7107],
        [-0.9787, -0.6952, -0.7514,  0.3870,  0.8995,  0.8373],
        [-0.9673, -0.8912, -0.9747, -0.3439,  0.9841,  0.9391],
        [ 0.8125, -0.2326,  0.4056,  0.6016,  0.9140,  0.0254],
        [ 0.9946, -0.4834,  0.9768,  0.8491, -0.8901, -0.5485],
        [ 0.9732,  0.0537,  0.9738,  0.4130, -0.9766, -0.9829],
        [ 0.9986,  0.2271,  0.3305,  0.9234, -0.9822, -0.0872],
        [-0.9123, -0.7393, -0.9753,  0.8803,  0.0913,  0.8926],
        [-0.9977, -0.9890, -0.9862,  0.2773,  0.9841,  0.9574],
        [ 0.6004, -0.2726, -0.2033,  0.2312,  0.7734,  0.5287],
        [ 0.9961,  0.7170,  0.9923,  0.8818,  0.4001, -0.3756],
        [ 0.9662, -0.0835,  0.8857,  0.7435, -0.9884, -0.4829],
        [ 0.9562,  0.7084,  0.3488,  0.2531, -0.9677, -0.2075]],
       device='cuda:0')
squash tensor([[-2.8048, -2.1000, -1.2057,  2.4100,  2.2590,  1.4916],
        [-1.8359, -2.3273, -1.4406, -0.0597,  1.9905,  0.5305],
        [-0.6438,  1.3493, -0.8067, -2.1901, -0.4039,  0.9949],
        [ 2.3957,  0.8231,  2.2350,  1.2254, -0.8492,  0.3367],
        [-3.3840,  2.2081, -1.6763, -1.2174, -0.2313,  0.7469],
        [ 1.5953,  1.8119, -3.1560, -1.4224,  0.1968,  0.9258],
        [ 2.7772, -0.7333,  2.5535, -1.1722, -2.4642, -2.0315],
        [ 3.1362,  1.6619, -1.3520,  0.1191, -1.6963, -0.8886],
        [-2.2662, -0.8579, -0.9761,  0.4083,  1.4695,  1.2122],
        [-2.0484, -1.4276, -2.1788, -0.3585,  2.4125,  1.7303],
        [ 1.1344, -0.2369,  0.4304,  0.6957,  1.5514,  0.0254],
        [ 2.9535, -0.5274,  2.2236,  1.2529, -1.4224, -0.6162],
        [ 2.1496,  0.0538,  2.1612,  0.4393, -2.2190, -2.3752],
        [ 3.6167,  0.2312,  0.3434,  1.6113, -2.3559, -0.0874],
        [-1.5411, -0.9490, -2.1901,  1.3771,  0.0916,  1.4346],
        [-3.3816, -2.5976, -2.4863,  0.2847,  2.4144,  1.9135],
        [ 0.6938, -0.2797, -0.2061,  0.2354,  1.0287,  0.5884],
        [ 3.1146,  0.9014,  2.7753,  1.3840,  0.4238, -0.3949],
        [ 2.0317, -0.0837,  1.4017,  0.9583, -2.5702, -0.5268],
        [ 1.8996,  0.8839,  0.3640,  0.2587, -2.0546, -0.2105]],
       device='cuda:0')
action: tensor([[-0.9847, -0.9305, -0.9791, -0.0773,  0.9746,  0.6023],
        [ 0.5992, -0.2832, -0.4200,  0.4498,  0.4582,  0.8019],
        [ 0.9908, -0.0290,  0.9761,  0.5413, -0.8942,  0.0679],
        [ 0.9858, -0.0705,  0.9834, -0.4588, -0.9386, -0.5776],
        [ 0.9953,  0.6977,  0.9909,  0.2012, -0.4551, -0.7386],
        [ 0.9366,  0.6220, -0.4982, -0.2578, -0.8990, -0.8007],
        [-0.9795, -0.9536, -0.9359, -0.1508,  0.8517,  0.0343],
        [-0.9310, -0.9880, -0.9690, -0.6899,  0.9896,  0.8906],
        [ 0.8462,  0.2737, -0.2877, -0.3869,  0.7586,  0.1322],
        [ 0.9929, -0.7073,  0.9602, -0.2095, -0.8448, -0.6009],
        [ 0.9091, -0.3350,  0.9739,  0.2943, -0.5955,  0.2211],
        [ 0.9661, -0.3667,  0.6982,  0.8230, -0.9510, -0.9011],
        [ 0.5680, -0.4290, -0.7173,  0.4974, -0.9450, -0.8824],
        [-0.9776, -0.6657, -0.8889,  0.5445,  0.9052,  0.7870],
        [-0.9118, -0.9886, -0.9853, -0.8612,  0.9414,  0.8547],
        [ 0.3510,  0.8130, -0.9534, -0.2693,  0.2763, -0.5996],
        [ 0.9620,  0.3005,  0.9485,  0.4218, -0.8675,  0.6439],
        [ 0.9800,  0.1814,  0.9856,  0.2515, -0.9281, -0.4846],
        [ 0.9892,  0.1140, -0.7041,  0.6603, -0.9767, -0.9488],
        [-0.9916, -0.8262, -0.8108,  0.4275,  0.9698,  0.5646]],
       device='cuda:0')
squash tensor([[-2.4342, -1.6618, -2.2756, -0.0774,  2.1764,  0.6968],
        [ 0.6918, -0.2912, -0.4477,  0.4845,  0.4951,  1.1040],
        [ 2.6891, -0.0290,  2.2077,  0.6060, -1.4426,  0.0680],
        [ 2.4707, -0.0706,  2.3917, -0.4958, -1.7258, -0.6588],
        [ 3.0272,  0.8627,  2.6939,  0.2040, -0.4911, -0.9474],
        [ 1.7099,  0.7283, -0.5470, -0.2638, -1.4672, -1.1006],
        [-2.2850, -1.8698, -1.7041, -0.1520,  1.2625,  0.0343],
        [-1.6656, -2.5570, -2.0760, -0.8477,  2.6293,  1.4251],
        [ 1.2426,  0.2809, -0.2961, -0.4081,  0.9929,  0.1330],
        [ 2.8191, -0.8817,  1.9487, -0.2127, -1.2378, -0.6946],
        [ 1.5225, -0.3484,  2.1620,  0.3033, -0.6862,  0.2248],
        [ 2.0303, -0.3846,  0.8638,  1.1661, -1.8419, -1.4778],
        [ 0.6446, -0.4586, -0.9020,  0.5459, -1.7832, -1.3864],
        [-2.2402, -0.8030, -1.4166,  0.6106,  1.5002,  1.0635],
        [-1.5382, -2.5791, -2.4533, -1.2978,  1.7501,  1.2733],
        [ 0.3666,  1.1357, -1.8679, -0.2761,  0.2837, -0.6925],
        [ 1.9726,  0.3100,  1.8167,  0.4499, -1.3228,  0.7648],
        [ 2.2983,  0.1834,  2.4644,  0.2570, -1.6444, -0.5290],
        [ 2.6098,  0.1145, -0.8753,  0.7934, -2.2193, -1.8196],
        [-2.7332, -1.1760, -1.1294,  0.4569,  2.0892,  0.6396]],
       device='cuda:0')
action: tensor([[-0.0928,  0.2555, -0.9889, -0.3341,  0.9192,  0.4973],
        [ 0.9772, -0.1381,  0.9173,  0.7164, -0.1399,  0.7012],
        [ 0.9831, -0.4696,  0.9901, -0.4174, -0.6246, -0.1955],
        [ 0.9919,  0.6323,  0.9895,  0.4668, -0.8115, -0.7773],
        [ 0.9357,  0.1780, -0.1766,  0.3925, -0.9006, -0.9623],
        [-0.9890, -0.9347, -0.9448, -0.0574,  0.9603, -0.8901],
        [-0.8603, -0.9774, -0.8862, -0.7943,  0.9799,  0.6065],
        [ 0.6466,  0.6373, -0.3728, -0.3639,  0.8342, -0.0362],
        [ 0.9340, -0.6562,  0.9873,  0.1364, -0.9214, -0.7586],
        [ 0.9881,  0.3383,  0.8515,  0.7278, -0.9843, -0.8600],
        [ 0.9951, -0.5343, -0.8795,  0.9624, -0.9779,  0.0943],
        [-0.9801, -0.9765, -0.9495,  0.9929,  0.9054,  0.9534],
        [-0.9745, -0.9911, -0.8224, -0.0187,  0.9117,  0.9947],
        [ 0.9104,  0.9573, -0.9285, -0.1247,  0.6504,  0.4440],
        [ 0.9847, -0.1692,  0.8583,  0.5581, -0.5738,  0.5083],
        [ 0.8547, -0.2919,  0.8785, -0.0517, -0.9191, -0.3157],
        [ 0.9941,  0.6237,  0.9113,  0.5568, -0.9390, -0.9007],
        [ 0.9733, -0.2328, -0.2459,  0.4344, -0.9592, -0.8371],
        [-0.9841, -0.9617, -0.8528,  0.3223,  0.9296,  0.3254],
        [-0.9334, -0.9930, -0.9496, -0.4958,  0.8786,  0.4447]],
       device='cuda:0')
squash tensor([[-0.0931,  0.2613, -2.5948, -0.3474,  1.5841,  0.5457],
        [ 2.2321, -0.1390,  1.5720,  0.9001, -0.1408,  0.8697],
        [ 2.3815, -0.5096,  2.6538, -0.4446, -0.7326, -0.1980],
        [ 2.7555,  0.7453,  2.6215,  0.5060, -1.1314, -1.0386],
        [ 1.7021,  0.1799, -0.1785,  0.4147, -1.4752, -1.9761],
        [-2.5998, -1.6944, -1.7813, -0.0574,  1.9499, -1.4224],
        [-1.2947, -2.2360, -1.4040, -1.0829,  2.2953,  0.7033],
        [ 0.7695,  0.7536, -0.3917, -0.3814,  1.2019, -0.0362],
        [ 1.6890, -0.7860,  2.5247,  0.1372, -1.5980, -0.9929],
        [ 2.5584,  0.3521,  1.2616,  0.9241, -2.4193, -1.2933],
        [ 3.0051, -0.5961, -1.3734,  1.9779, -2.2478,  0.0946],
        [-2.2989, -2.2170, -1.8271,  2.8180,  1.5013,  1.8682],
        [-2.1741, -2.7035, -1.1642, -0.0187,  1.5375,  2.9646],
        [ 1.5297,  1.9128, -1.6477, -0.1253,  0.7760,  0.4772],
        [ 2.4317, -0.1708,  1.2869,  0.6301, -0.6532,  0.5604],
        [ 1.2733, -0.3007,  1.3691, -0.0517, -1.5835, -0.3269],
        [ 2.9125,  0.7311,  1.5354,  0.6281, -1.7296, -1.4758],
        [ 2.1514, -0.2372, -0.2510,  0.4654, -1.9362, -1.2116],
        [-2.4130, -1.9684, -1.2665,  0.3342,  1.6552,  0.3376],
        [-1.6842, -2.8232, -1.8277, -0.5437,  1.3696,  0.4781]],
       device='cuda:0')
action: tensor([[ 0.9806,  0.9512, -0.8272, -0.9569, -0.8939, -0.4663],
        [ 0.9734, -0.7049,  0.9455, -0.9313, -0.7355, -0.4697],
        [ 0.9562,  0.7124, -0.8481,  0.6138, -0.9503, -0.9051],
        [-0.9775, -0.9919, -0.9658,  0.7176,  0.9879,  0.9853],
        [-0.9141, -0.9826, -0.9028, -0.9574,  0.9150,  0.9671],
        [ 0.7013,  0.2622, -0.3541,  0.7778,  0.7795,  0.5647],
        [ 0.9935,  0.4429,  0.9607,  0.7058, -0.9643, -0.8600],
        [ 0.9906,  0.5301,  0.7026,  0.2648, -0.9160, -0.4563],
        [ 0.9871, -0.2035, -0.7908,  0.9542, -0.9514, -0.5027],
        [-0.9984, -0.9469, -0.8474,  0.8915,  0.9712,  0.9476],
        [-0.9789, -0.9932, -0.9598,  0.1242,  0.9763,  0.8250],
        [ 0.9282,  0.5109, -0.7488, -0.8826,  0.4495,  0.7811],
        [ 0.9730, -0.3049,  0.9971,  0.6767, -0.3153,  0.6481],
        [-0.9359, -0.0501,  0.0298,  0.5795,  0.3874,  0.6537],
        [-0.8429,  0.8823, -0.7363, -0.6454,  0.0970,  0.9315],
        [ 0.6790,  0.5608, -0.9108, -0.8187, -0.6775, -0.8396],
        [ 0.9699, -0.6426,  0.7859, -0.9198, -0.9703, -0.8780],
        [ 0.9953, -0.8492, -0.4431,  0.6159, -0.9901, -0.8617],
        [-0.9817, -0.9868, -0.9389,  0.4533,  0.9752,  0.9552],
        [-0.9807, -0.9911, -0.9127, -0.4098,  0.9825,  0.9814]],
       device='cuda:0')
squash tensor([[ 2.3127,  1.8441, -1.1792, -1.9076, -1.4408, -0.5054],
        [ 2.1531, -0.8769,  1.7874, -1.6684, -0.9406, -0.5096],
        [ 1.8991,  0.8920, -1.2494,  0.7150, -1.8352, -1.4995],
        [-2.2378, -2.7530, -2.0262,  0.9026,  2.5526,  2.4537],
        [-1.5517, -2.3680, -1.4874, -1.9139,  1.5574,  2.0455],
        [ 0.8699,  0.2684, -0.3702,  1.0398,  1.0441,  0.6397],
        [ 2.8628,  0.4758,  1.9551,  0.8788, -2.0045, -1.2932],
        [ 2.6783,  0.5902,  0.8725,  0.2713, -1.5633, -0.4927],
        [ 2.5203, -0.2063, -1.0736,  1.8768, -1.8467, -0.5529],
        [-3.5773, -1.8005, -1.2468,  1.4291,  2.1134,  1.8076],
        [-2.2695, -2.8439, -1.9437,  0.1248,  2.2125,  1.1721],
        [ 1.6455,  0.5639, -0.9702, -1.3873,  0.4841,  1.0483],
        [ 2.1451, -0.3149,  3.2714,  0.8230, -0.3264,  0.7721],
        [-1.7042, -0.0502,  0.0298,  0.6617,  0.4087,  0.7818],
        [-1.2312,  1.3859, -0.9423, -0.7674,  0.0973,  1.6695],
        [ 0.8272,  0.6340, -1.5322, -1.1528, -0.8244, -1.2199],
        [ 2.0914, -0.7626,  1.0607, -1.5878, -2.0968, -1.3668],
        [ 3.0246, -1.2532, -0.4761,  0.7184, -2.6492, -1.2998],
        [-2.3416, -2.5067, -1.7287,  0.4888,  2.1887,  1.8875],
        [-2.3143, -2.7071, -1.5432, -0.4354,  2.3642,  2.3353]],
       device='cuda:0')
action: tensor([[ 0.9798, -0.2396,  0.8823,  0.3252, -0.6988, -0.1901],
        [ 0.9823, -0.3866,  0.9706,  0.5076, -0.7769, -0.8352],
        [ 0.9014, -0.8565, -0.6159,  0.8578, -0.7548, -0.8338],
        [-0.9853, -0.9127, -0.9110,  0.5242,  0.9750, -0.6937],
        [-0.9505, -0.9800, -0.9274, -0.6729,  0.9060,  0.7593],
        [ 0.6743,  0.7146, -0.8107, -0.7938,  0.0411, -0.0255],
        [ 0.9945, -0.4854,  0.9903,  0.2480, -0.9468, -0.5458],
        [ 0.9945,  0.3930,  0.9860, -0.1113, -0.9829, -0.9419],
        [ 0.9712,  0.0936, -0.9689,  0.9165, -0.9168, -0.1966],
        [-0.9955, -0.9840, -0.9668,  0.6713,  0.9566,  0.8340],
        [-0.9939, -0.9660, -0.9912, -0.4809,  0.9340,  0.9311],
        [ 0.9074,  0.7092, -0.9616, -0.3237,  0.1332,  0.5335],
        [ 0.9615, -0.6032,  0.9750,  0.5397, -0.9413,  0.0263],
        [ 0.9663,  0.5586,  0.9978,  0.0911, -0.7916,  0.4532],
        [ 0.9922,  0.3247,  0.8598, -0.1485, -0.8472, -0.9488],
        [ 0.9642,  0.1433, -0.5009, -0.0089, -0.8686, -0.9819],
        [-0.9548, -0.9142, -0.9833,  0.1867,  0.8934, -0.5728],
        [-0.9890, -0.9829, -0.9741, -0.6810,  0.9886,  0.8633],
        [ 0.9406,  0.0716, -0.7545, -0.4483,  0.7792, -0.2117],
        [ 0.9979,  0.0215,  0.9896,  0.0540, -0.9782, -0.0390]],
       device='cuda:0')
squash tensor([[ 2.2923, -0.2444,  1.3860,  0.3374, -0.8650, -0.1925],
        [ 2.3590, -0.4078,  2.1019,  0.5595, -1.0376, -1.2050],
        [ 1.4797, -1.2801, -0.7184,  1.2851, -0.9841, -1.2004],
        [-2.4520, -1.5433, -1.5331,  0.5821,  2.1847, -0.8551],
        [-1.8369, -2.2983, -1.6396, -0.8161,  1.5046,  0.9944],
        [ 0.8186,  0.8965, -1.1291, -1.0816,  0.0412, -0.0255],
        [ 2.9445, -0.5300,  2.6612,  0.2533, -1.7999, -0.6123],
        [ 2.9499,  0.4153,  2.4758, -0.1117, -2.3756, -1.7551],
        [ 2.1136,  0.0939, -2.0747,  1.5670, -1.5683, -0.1992],
        [-3.0476, -2.4095, -2.0401,  0.8131,  1.9040,  1.2011],
        [-2.8950, -2.0287, -2.7094, -0.5242,  1.6892,  1.6666],
        [ 1.5127,  0.8857, -1.9665, -0.3358,  0.1340,  0.5950],
        [ 1.9650, -0.6981,  2.1851,  0.6038, -1.7492,  0.0263],
        [ 2.0330,  0.6308,  3.4151,  0.0913, -1.0757,  0.4888],
        [ 2.7687,  0.3369,  1.2925, -0.1496, -1.2462, -1.8200],
        [ 2.0025,  0.1443, -0.5504, -0.0089, -1.3273, -2.3466],
        [-1.8831, -1.5527, -2.3878,  0.1889,  1.4386, -0.6517],
        [-2.5975, -2.3763, -2.1662, -0.8310,  2.5798,  1.3060],
        [ 1.7432,  0.0718, -0.9832, -0.4825,  1.0434, -0.2150],
        [ 3.4308,  0.0215,  2.6257,  0.0541, -2.2541, -0.0390]],
       device='cuda:0')
action: tensor([[ 0.7345,  0.8114, -0.9569, -0.6682,  0.4903,  0.8230],
        [ 0.9784,  0.0206,  0.9841,  0.5685, -0.5736, -0.4346],
        [ 0.9770,  0.4244,  0.9796,  0.7038, -0.5623, -0.7011],
        [ 0.9908,  0.0608, -0.4813,  0.5709, -0.9794, -0.9044],
        [-0.9942, -0.9970, -0.9800,  0.6749,  0.8674, -0.8752],
        [-0.9890, -0.9822, -0.9807, -0.6805,  0.8708,  0.7968],
        [ 0.4419,  0.9201, -0.9781, -0.9505,  0.3750,  0.1651],
        [ 0.9888,  0.0591,  0.9968, -0.1477, -0.6710,  0.2950],
        [ 0.9668,  0.6565,  0.9684,  0.4059, -0.9273, -0.5659],
        [ 0.8412, -0.5999, -0.8911,  0.9458, -0.9503, -0.2247],
        [-0.9929, -0.9533, -0.9807,  0.6903,  0.9713,  0.6236],
        [-0.9717, -0.9923, -0.9431, -0.6384,  0.9612,  0.3325],
        [ 0.4756,  0.7457, -0.9207, -0.8602, -0.3407, -0.1711],
        [ 0.8945, -0.3237,  0.9847,  0.7886,  0.1124,  0.0246],
        [ 0.9906,  0.6953,  0.9073,  0.0238, -0.9048,  0.6858],
        [ 0.9943,  0.1225, -0.0276,  0.5187, -0.8178, -0.7138],
        [ 0.9843, -0.2234, -0.8267, -0.0537, -0.9300, -0.7278],
        [-0.9565, -0.9792, -0.9673,  0.6838,  0.9170, -0.5707],
        [-0.9894, -0.9957, -0.9443, -0.7560,  0.9307,  0.8815],
        [ 0.2345,  0.9669, -0.8162, -0.9141, -0.6584,  0.3258]],
       device='cuda:0')
squash tensor([[ 0.9383,  1.1310, -1.9079, -0.8075,  0.5365,  1.1660],
        [ 2.2593,  0.0206,  2.4148,  0.6453, -0.6528, -0.4655],
        [ 2.2265,  0.4531,  2.2879,  0.8747, -0.6362, -0.8694],
        [ 2.6908,  0.0609, -0.5247,  0.6489, -2.2817, -1.4961],
        [-2.9173, -3.2553, -2.2964,  0.8197,  1.3225, -1.3547],
        [-2.5973, -2.3562, -2.3167, -0.8301,  1.3365,  1.0899],
        [ 0.4746,  1.5895, -2.2527, -1.8374,  0.3942,  0.1667],
        [ 2.5877,  0.0592,  3.2153, -0.1487, -0.8125,  0.3040],
        [ 2.0413,  0.7867,  2.0653,  0.4307, -1.6385, -0.6415],
        [ 1.2254, -0.6930, -1.4270,  1.7901, -1.8347, -0.2286],
        [-2.8169, -1.8669, -2.3142,  0.8485,  2.1148,  0.7309],
        [-2.1211, -2.7796, -1.7650, -0.7555,  1.9612,  0.3456],
        [ 0.5173,  0.9632, -1.5937, -1.2942, -0.3549, -0.1728],
        [ 1.4439, -0.3358,  2.4317,  1.0678,  0.1129,  0.0246],
        [ 2.6774,  0.8581,  1.5122,  0.0239, -1.4978,  0.8400],
        [ 2.9326,  0.1231, -0.0276,  0.5746, -1.1502, -0.8949],
        [ 2.4197, -0.2273, -1.1776, -0.0537, -1.6587, -0.9241],
        [-1.9026, -2.2783, -2.0481,  0.8363,  1.5696, -0.6485],
        [-2.6162, -3.0732, -1.7761, -0.9869,  1.6633,  1.3824],
        [ 0.2389,  2.0416, -1.1453, -1.5520, -0.7899,  0.3381]],
       device='cuda:0')
action: tensor([[ 5.7616e-01,  1.1840e-01,  6.3228e-02,  2.6001e-01,  7.9482e-01,
          3.7799e-01],
        [ 9.0858e-01,  8.2547e-01,  7.7337e-01,  5.0217e-01, -9.6342e-01,
         -9.5448e-01],
        [ 9.9293e-01,  1.4696e-01,  9.2494e-01,  9.3539e-01, -9.1906e-01,
         -5.6029e-01],
        [ 7.6673e-01, -7.9813e-01, -9.8352e-01,  9.9062e-01, -8.6389e-01,
         -1.6139e-01],
        [-9.9597e-01, -9.6093e-01, -9.0397e-01,  9.8957e-01,  8.7711e-01,
          9.5382e-01],
        [-9.9142e-01, -9.3368e-01, -9.7397e-01, -5.8605e-02,  9.0365e-01,
          6.9180e-01],
        [-3.2358e-01,  9.6269e-01, -6.9016e-01, -9.9742e-01, -7.2137e-01,
          2.6133e-01],
        [ 7.6075e-01,  7.6297e-01,  9.8487e-01,  5.3927e-01, -7.7407e-01,
         -5.8148e-01],
        [-8.7328e-01,  9.8441e-02, -8.2355e-01,  3.4010e-01,  6.0249e-01,
          4.4758e-01],
        [-8.0584e-01,  9.8466e-01, -7.9171e-01, -8.3648e-01, -5.0914e-01,
         -1.8394e-01],
        [ 9.7083e-01,  9.8241e-01, -8.7221e-01, -9.7032e-01, -8.3772e-01,
         -4.0714e-01],
        [ 9.9772e-01, -4.6008e-01,  9.4717e-01, -9.8513e-01, -9.0325e-01,
         -9.8470e-01],
        [ 9.9419e-01,  6.1432e-01,  1.6376e-01,  3.4013e-01, -9.6047e-01,
         -9.8297e-01],
        [-5.1723e-01, -5.8373e-01, -7.4394e-01,  4.0284e-01,  2.1006e-01,
          4.8184e-01],
        [-9.8699e-01, -9.4056e-01, -9.7744e-01,  7.1321e-04,  9.8709e-01,
          9.4146e-01],
        [ 2.6657e-01, -5.5993e-01, -4.7445e-01,  4.5938e-01,  9.7535e-01,
          8.9017e-01],
        [ 8.9428e-01,  9.0234e-01,  9.6841e-01,  3.8542e-01, -7.9443e-01,
         -5.3458e-01],
        [ 9.7189e-01,  4.8330e-01,  9.3882e-01,  5.3774e-01, -9.8906e-01,
         -8.9378e-01],
        [ 9.6880e-01,  8.7366e-01,  9.3935e-01,  8.9559e-01, -9.7296e-01,
         -9.6140e-01],
        [ 9.7503e-01,  3.1606e-01, -8.7414e-01,  5.6445e-01, -9.0052e-01,
          4.9689e-01]], device='cuda:0')
squash tensor([[ 6.5670e-01,  1.1896e-01,  6.3313e-02,  2.6612e-01,  1.0844e+00,
          3.9771e-01],
        [ 1.5193e+00,  1.1738e+00,  1.0287e+00,  5.5221e-01, -1.9915e+00,
         -1.8799e+00],
        [ 2.8208e+00,  1.4803e-01,  1.6222e+00,  1.6998e+00, -1.5830e+00,
         -6.3326e-01],
        [ 1.0124e+00, -1.0934e+00, -2.3952e+00,  2.6791e+00, -1.3085e+00,
         -1.6281e-01],
        [-3.1024e+00, -1.9579e+00, -1.4935e+00,  2.6254e+00,  1.3631e+00,
          1.8725e+00],
        [-2.7237e+00, -1.6863e+00, -2.1644e+00, -5.8672e-02,  1.4918e+00,
          8.5140e-01],
        [-3.3564e-01,  1.9815e+00, -8.4827e-01, -3.3260e+00, -9.1050e-01,
          2.6754e-01],
        [ 9.9800e-01,  1.0033e+00,  2.4384e+00,  6.0312e-01, -1.0304e+00,
         -6.6470e-01],
        [-1.3467e+00,  9.8761e-02, -1.1677e+00,  3.5421e-01,  6.9704e-01,
          4.8167e-01],
        [-1.1150e+00,  2.4315e+00, -1.0760e+00, -1.2093e+00, -5.6157e-01,
         -1.8606e-01],
        [ 2.1065e+00,  2.3624e+00, -1.3422e+00, -2.0977e+00, -1.2135e+00,
         -4.3218e-01],
        [ 3.3875e+00, -4.9741e-01,  1.8035e+00, -2.4472e+00, -1.4896e+00,
         -2.4327e+00],
        [ 2.9192e+00,  7.1584e-01,  1.6525e-01,  3.5424e-01, -1.9520e+00,
         -2.3786e+00],
        [-5.7255e-01, -6.6810e-01, -9.5925e-01,  4.2703e-01,  2.1323e-01,
          5.2538e-01],
        [-2.5145e+00, -1.7429e+00, -2.2367e+00,  7.1321e-04,  2.5184e+00,
          1.7508e+00],
        [ 2.7316e-01, -6.3273e-01, -5.1580e-01,  4.9652e-01,  2.1919e+00,
          1.4228e+00],
        [ 1.4429e+00,  1.4847e+00,  2.0661e+00,  4.0641e-01, -1.0833e+00,
         -5.9654e-01],
        [ 2.1253e+00,  5.2729e-01,  1.7280e+00,  6.0098e-01, -2.6013e+00,
         -1.4404e+00],
        [ 2.0724e+00,  1.3483e+00,  1.7325e+00,  1.4495e+00, -2.1449e+00,
         -1.9641e+00],
        [ 2.1853e+00,  3.2726e-01, -1.3504e+00,  6.3934e-01, -1.4750e+00,
          5.4517e-01]], device='cuda:0')
action: tensor([[-0.9533, -0.9980, -0.6467,  0.8118,  0.9708, -0.9576],
        [-0.9841, -0.9685, -0.8082, -0.9702,  0.8563,  0.2163],
        [-0.4836,  0.8051, -0.9299, -0.9995,  0.3021,  0.9080],
        [ 0.9696,  0.7210,  0.9699, -0.0297, -0.9284, -0.8817],
        [ 0.9945,  0.8610,  0.9560,  0.5737, -0.9152, -0.9503],
        [ 0.9633,  0.0838, -0.9266,  0.9394, -0.9480, -0.9319],
        [-0.9927, -0.8211, -0.9742,  0.6708,  0.9650,  0.8941],
        [-0.8651, -0.9531, -0.9178, -0.1744,  0.9583,  0.8051],
        [ 0.9034,  0.5692, -0.9485, -0.5528,  0.4763,  0.7914],
        [ 0.9928, -0.1133,  0.9669,  0.5439, -0.6320, -0.2928],
        [ 0.9591, -0.6196,  0.9969,  0.6646, -0.9445,  0.4693],
        [ 0.9650, -0.5122, -0.8862,  0.9816, -0.9547, -0.8908],
        [-0.9890, -0.9605, -0.9839,  0.6213,  0.7970, -0.1534],
        [-0.9779, -0.9351, -0.9761, -0.2041,  0.9783,  0.5831],
        [ 0.0618,  0.8483, -0.7468, -0.7707, -0.0473,  0.3563],
        [ 0.9866, -0.0350,  0.9991,  0.7615, -0.2758, -0.9201],
        [ 0.9109, -0.0063,  0.9240, -0.1884, -0.5343, -0.2665],
        [ 0.9847,  0.1380,  0.9034,  0.5685, -0.7720, -0.9325],
        [ 0.9604, -0.2039, -0.9513,  0.0975, -0.9860, -0.9868],
        [-0.9847, -0.9179, -0.9944,  0.5728,  0.8165, -0.6916]],
       device='cuda:0')
squash tensor([[-1.8664, -3.4575, -0.7696,  1.1323,  2.1055, -1.9156],
        [-2.4120, -2.0675, -1.1217, -2.0954,  1.2794,  0.2198],
        [-0.5277,  1.1130, -1.6573, -4.1781,  0.3118,  1.5163],
        [ 2.0853,  0.9097,  2.0900, -0.0297, -1.6467, -1.3834],
        [ 2.9477,  1.2971,  1.8969,  0.6531, -1.5584, -1.8353],
        [ 1.9903,  0.0839, -1.6339,  1.7331, -1.8117, -1.6726],
        [-2.8065, -1.1602, -2.1689,  0.8121,  2.0137,  1.4418],
        [-1.3131, -1.8643, -1.5747, -0.1762,  1.9243,  1.1130],
        [ 1.4902,  0.6463, -1.8171, -0.6224,  0.5181,  1.0751],
        [ 2.8141, -0.1138,  2.0426,  0.6097, -0.7447, -0.3016],
        [ 1.9341, -0.7243,  3.2389,  0.8011, -1.7784,  0.5092],
        [ 2.0134, -0.5657, -1.4040,  2.3387, -1.8823, -1.4257],
        [-2.5975, -1.9529, -2.4075,  0.7271,  1.0902, -0.1546],
        [-2.2467, -1.6978, -2.2076, -0.2071,  2.2566,  0.6672],
        [ 0.0619,  1.2500, -0.9657, -1.0221, -0.0473,  0.3727],
        [ 2.4992, -0.0351,  3.8535,  0.9998, -0.2831, -1.5894],
        [ 1.5331, -0.0063,  1.6156, -0.1907, -0.5961, -0.2731],
        [ 2.4331,  0.1389,  1.4903,  0.6453, -1.0252, -1.6772],
        [ 1.9510, -0.2068, -1.8453,  0.0978, -2.4771, -2.5076],
        [-2.4327, -1.5752, -2.9342,  0.6517,  1.1463, -0.8510]],
       device='cuda:0')
action: tensor([[-0.9616, -0.9564, -0.9748,  0.5252,  0.9928,  0.7625],
        [-0.9402, -0.9801, -0.9665, -0.3488,  0.9763,  0.9858],
        [ 0.9169,  0.4747, -0.8117,  0.4485,  0.7745,  0.7960],
        [ 0.9640, -0.4271,  0.9580,  0.2756, -0.9320, -0.7548],
        [ 0.9660, -0.4319,  0.9895, -0.0011, -0.8695, -0.7762],
        [ 0.9975,  0.1131,  0.8827,  0.7220, -0.9696, -0.9109],
        [ 0.6441,  0.0118, -0.7665,  0.2495, -0.9717, -0.9887],
        [-0.9846, -0.9885, -0.9725,  0.8204,  0.9571,  0.7540],
        [-0.9344, -0.9726, -0.9692, -0.8782,  0.9686,  0.8791],
        [ 0.2814,  0.7175, -0.9634, -0.1055, -0.2955,  0.0749],
        [ 0.9726,  0.4635,  0.9185,  0.6927, -0.8886, -0.6083],
        [ 0.9592,  0.6862,  0.9861,  0.1952, -0.9735,  0.0737],
        [ 0.9747,  0.2417, -0.5899,  0.8356, -0.8725, -0.9114],
        [-0.9953, -0.8557, -0.9420,  0.6299,  0.9112,  0.7880],
        [-0.8865, -0.9748, -0.9623, -0.6667,  0.5480,  0.7237],
        [ 0.8852,  0.6343, -0.9871, -0.5017,  0.8104,  0.2312],
        [ 0.9928, -0.8833,  0.9842,  0.3179, -0.5363,  0.2989],
        [ 0.9152, -0.3733,  0.9485,  0.7747, -0.8352, -0.3554],
        [ 0.8644, -0.9578, -0.5479,  0.8956, -0.7808, -0.7645],
        [-0.9952, -0.9508, -0.9496,  0.8353,  0.9576, -0.8084]],
       device='cuda:0')
squash tensor([[-1.9662e+00, -1.9021e+00, -2.1810e+00,  5.8353e-01,  2.8105e+00,
          1.0021e+00],
        [-1.7396e+00, -2.2999e+00, -2.0357e+00, -3.6407e-01,  2.2124e+00,
          2.4691e+00],
        [ 1.5695e+00,  5.1610e-01, -1.1320e+00,  4.8288e-01,  1.0314e+00,
          1.0876e+00],
        [ 2.0000e+00, -4.5631e-01,  1.9212e+00,  2.8293e-01, -1.6731e+00,
         -9.8395e-01],
        [ 2.0281e+00, -4.6225e-01,  2.6203e+00, -1.0646e-03, -1.3311e+00,
         -1.0357e+00],
        [ 3.3508e+00,  1.1360e-01,  1.3879e+00,  9.1181e-01, -2.0855e+00,
         -1.5330e+00],
        [ 7.6519e-01,  1.1778e-02, -1.0119e+00,  2.5486e-01, -2.1211e+00,
         -2.5859e+00],
        [-2.4296e+00, -2.5783e+00, -2.1362e+00,  1.1580e+00,  1.9101e+00,
          9.8205e-01],
        [-1.6917e+00, -2.1391e+00, -2.0784e+00, -1.3677e+00,  2.0698e+00,
          1.3717e+00],
        [ 2.8915e-01,  9.0237e-01, -1.9910e+00, -1.0588e-01, -3.0460e-01,
          7.5006e-02],
        [ 2.1374e+00,  5.0179e-01,  1.5796e+00,  8.5305e-01, -1.4152e+00,
         -7.0622e-01],
        [ 1.9353e+00,  8.4075e-01,  2.4806e+00,  1.9772e-01, -2.1555e+00,
          7.3877e-02],
        [ 2.1788e+00,  2.4659e-01, -6.7751e-01,  1.2063e+00, -1.3437e+00,
         -1.5355e+00],
        [-3.0255e+00, -1.2771e+00, -1.7557e+00,  7.4117e-01,  1.5345e+00,
          1.0661e+00],
        [-1.4053e+00, -2.1800e+00, -1.9767e+00, -8.0473e-01,  6.1545e-01,
          9.1534e-01],
        [ 1.3991e+00,  7.4861e-01, -2.5192e+00, -5.5158e-01,  1.1282e+00,
          2.3550e-01],
        [ 2.8147e+00, -1.3906e+00,  2.4165e+00,  3.2927e-01, -5.9893e-01,
          3.0829e-01],
        [ 1.5584e+00, -3.9224e-01,  1.8171e+00,  1.0319e+00, -1.2052e+00,
         -3.7161e-01],
        [ 1.3106e+00, -1.9186e+00, -6.1543e-01,  1.4496e+00, -1.0475e+00,
         -1.0070e+00],
        [-3.0132e+00, -1.8405e+00, -1.8275e+00,  1.2055e+00,  1.9161e+00,
         -1.1223e+00]], device='cuda:0')
action: tensor([[-0.9137, -0.7052, -0.9460,  0.3044,  0.9645,  0.7302],
        [-0.9825, -0.9935, -0.8957, -0.3790,  0.9781,  0.9727],
        [ 0.8798, -0.1312,  0.7002,  0.8354,  0.8976,  0.3639],
        [ 0.9951, -0.0663,  0.9498,  0.7477, -0.8192, -0.5952],
        [ 0.9350, -0.4015,  0.8686,  0.9686, -0.8758, -0.8610],
        [-0.8321, -0.9215, -0.9801,  0.9967, -0.4227,  0.4014],
        [-0.8004, -0.8610, -0.9927,  0.8465,  0.9670,  0.9647],
        [-0.7209,  1.0000, -0.8811, -0.9997, -0.9998, -0.9647],
        [ 0.6130,  0.9929, -0.9537, -0.9834, -0.9397,  0.7607],
        [-0.3793, -0.7334,  0.5150,  0.9414,  0.9352,  0.2968],
        [ 0.3280,  0.0359,  0.9260, -0.5295,  0.2785,  0.1573],
        [ 0.9548, -0.4571,  0.8741, -0.1888, -0.6520, -0.8492],
        [ 0.9363,  0.7556,  0.8503, -0.4795, -0.8429, -0.9472],
        [ 0.9535, -0.3419,  0.0725, -0.2253, -0.8434, -0.9644],
        [ 0.9449, -0.7936, -0.0210,  0.4645, -0.9696, -0.9874],
        [-0.9792, -0.9931, -0.9353, -0.0184,  0.9281, -0.9255],
        [-0.6645, -0.9484, -0.9460, -0.6738,  0.9977,  0.7330],
        [-0.7853, -0.6639, -0.9373, -0.8960,  0.9421,  0.8519],
        [ 0.9707,  0.9887,  0.6202, -0.2679, -0.7353,  0.7126],
        [ 0.9831, -0.8594,  0.9753,  0.0978, -0.9853,  0.2728]],
       device='cuda:0')
squash tensor([[-1.5496, -0.8775, -1.7926,  0.3144,  2.0071,  0.9292],
        [-2.3664, -2.8664, -1.4501, -0.3988,  2.2523,  2.1409],
        [ 1.3751, -0.1320,  0.8678,  1.2057,  1.4595,  0.3814],
        [ 3.0089, -0.0664,  1.8296,  0.9678, -1.1543, -0.6857],
        [ 1.6966, -0.4255,  1.3275,  2.0688, -1.3575, -1.2973],
        [-1.1950, -1.5989, -2.3009,  3.1988, -0.4510,  0.4253],
        [-1.0998, -1.2971, -2.8059,  1.2438,  2.0444,  2.0103],
        [-0.9096,  5.5501, -1.3808, -4.4740, -4.6663, -2.0096],
        [ 0.7137,  2.8154, -1.8715, -2.3904, -1.7357,  0.9979],
        [-0.3992, -0.9360,  0.5695,  1.7502,  1.6986,  0.3060],
        [ 0.3406,  0.0359,  1.6297, -0.5895,  0.2860,  0.1586],
        [ 1.8837, -0.4936,  1.3503, -0.1911, -0.7788, -1.2532],
        [ 1.7068,  0.9858,  1.2572, -0.5223, -1.2312, -1.8035],
        [ 1.8694, -0.3563,  0.0726, -0.2292, -1.2328, -2.0050],
        [ 1.7820, -1.0811, -0.0210,  0.5031, -2.0850, -2.5310],
        [-2.2784, -2.8295, -1.6993, -0.0184,  1.6445, -1.6263],
        [-0.8009, -1.8153, -1.7921, -0.8177,  3.3823,  0.9352],
        [-1.0590, -0.7997, -1.7156, -1.4514,  1.7565,  1.2630],
        [ 2.1039,  2.5871,  0.7253, -0.2746, -0.9401,  0.8924],
        [ 2.3822, -1.2912,  2.1903,  0.0981, -2.4513,  0.2798]],
       device='cuda:0')
action: tensor([[ 6.3297e-01,  3.7600e-01,  2.4096e-01,  6.7527e-01, -9.1152e-01,
         -9.1099e-01],
        [-9.7435e-01, -8.3146e-01, -9.7636e-01,  5.5141e-01,  9.7276e-01,
          8.8178e-01],
        [-9.7170e-01, -9.7340e-01, -9.8607e-01, -7.0566e-01,  9.4119e-01,
          5.4731e-01],
        [ 9.7676e-01,  1.5597e-01, -4.2229e-01,  2.2150e-01,  9.1251e-01,
         -4.4463e-02],
        [ 9.9224e-01, -4.0848e-01,  9.9678e-01,  4.0490e-01, -9.7371e-01,
         -5.0721e-01],
        [ 9.7611e-01,  7.0056e-04,  9.8278e-01, -2.0420e-01, -9.9357e-01,
         -9.0019e-01],
        [ 9.9952e-01,  2.0216e-01, -8.8918e-02,  7.8829e-01, -9.3282e-01,
         -7.1824e-01],
        [-8.5029e-01, -9.3518e-01, -9.9197e-01,  8.0406e-01,  9.7946e-01,
          9.1878e-01],
        [-9.9501e-01, -9.9229e-01, -9.8106e-01, -2.0840e-01,  9.8880e-01,
          5.1903e-01],
        [ 7.0441e-01, -1.6574e-01, -2.7795e-01,  2.6877e-01,  9.5454e-01,
          9.4752e-01],
        [ 9.6088e-01,  1.7250e-01,  9.6757e-01,  2.7089e-01, -9.2879e-01,
         -5.3785e-01],
        [ 9.2820e-01, -8.6127e-01,  9.6524e-01,  8.3883e-01, -8.5944e-01,
          7.8984e-01],
        [ 9.9808e-01, -6.6954e-01,  9.9953e-01,  5.1083e-01, -6.1321e-01,
         -6.6585e-01],
        [ 9.6207e-01, -6.9569e-01, -3.7459e-02,  2.1112e-01, -9.7229e-01,
         -9.6421e-01],
        [-9.8086e-01, -8.7264e-01, -6.0480e-01,  4.3666e-01,  9.5517e-01,
         -8.0795e-01],
        [-6.4624e-01, -9.7314e-01, -9.5924e-01, -9.3073e-01,  9.9041e-01,
          9.6359e-02],
        [-8.3850e-01,  6.9919e-01, -6.6032e-01, -9.8665e-01,  2.5978e-01,
         -5.8830e-01],
        [ 9.8169e-01,  3.5369e-01,  8.6459e-01, -7.4170e-02, -9.8238e-01,
         -8.5586e-01],
        [ 9.8025e-01,  5.9360e-01,  9.7940e-01,  5.9726e-01, -9.6087e-01,
         -9.7455e-01],
        [ 9.1563e-01, -7.5518e-01, -9.8910e-01,  9.8633e-01, -8.8460e-01,
          9.4073e-01]], device='cuda:0')
squash tensor([[ 7.4636e-01,  3.9539e-01,  2.4580e-01,  8.2036e-01, -1.5364e+00,
         -1.5333e+00],
        [-2.1717e+00, -1.1928e+00, -2.2131e+00,  6.2041e-01,  2.1412e+00,
          1.3837e+00],
        [-2.1218e+00, -2.1533e+00, -2.4799e+00, -8.7848e-01,  1.7484e+00,
          6.1453e-01],
        [ 2.2217e+00,  1.5725e-01, -4.5047e-01,  2.2523e-01,  1.5423e+00,
         -4.4492e-02],
        [ 2.7739e+00, -4.3379e-01,  3.2152e+00,  4.2949e-01, -2.1592e+00,
         -5.5897e-01],
        [ 2.2077e+00,  7.0056e-04,  2.3731e+00, -2.0711e-01, -2.8683e+00,
         -1.4732e+00],
        [ 4.1642e+00,  2.0499e-01, -8.9153e-02,  1.0669e+00, -1.6797e+00,
         -9.0400e-01],
        [-1.2572e+00, -1.6981e+00, -2.7567e+00,  1.1100e+00,  2.2840e+00,
          1.5812e+00],
        [-2.9952e+00, -2.7773e+00, -2.3249e+00, -2.1150e-01,  2.5896e+00,
          5.7501e-01],
        [ 8.7601e-01, -1.6728e-01, -2.8546e-01,  2.7554e-01,  1.8806e+00,
          1.8070e+00],
        [ 1.9572e+00,  1.7424e-01,  2.0527e+00,  2.7782e-01, -1.6495e+00,
         -6.0112e-01],
        [ 1.6452e+00, -1.2982e+00,  2.0174e+00,  1.2172e+00, -1.2912e+00,
          1.0710e+00],
        [ 3.4748e+00, -8.0990e-01,  4.1729e+00,  5.6385e-01, -7.1405e-01,
         -8.0326e-01],
        [ 1.9730e+00, -8.5890e-01, -3.7476e-02,  2.1434e-01, -2.1327e+00,
         -2.0026e+00],
        [-2.3197e+00, -1.3441e+00, -7.0067e-01,  4.6810e-01,  1.8877e+00,
         -1.1211e+00],
        [-7.6881e-01, -2.1483e+00, -1.9363e+00, -1.6638e+00,  2.6675e+00,
          9.6659e-02],
        [-1.2161e+00,  8.6571e-01, -7.9339e-01, -2.5012e+00,  2.6587e-01,
         -6.7506e-01],
        [ 2.3420e+00,  3.6966e-01,  1.3113e+00, -7.4307e-02, -2.3614e+00,
         -1.2777e+00],
        [ 2.3040e+00,  6.8320e-01,  2.2827e+00,  6.8888e-01, -1.9571e+00,
         -2.1756e+00],
        [ 1.5613e+00, -9.8490e-01, -2.6032e+00,  2.4895e+00, -1.3966e+00,
          1.7444e+00]], device='cuda:0')
action: tensor([[ 0.9724, -0.8014, -0.9455,  0.2205, -0.9912, -0.9539],
        [-0.9955, -0.9645, -0.9390,  0.9788,  0.9823,  0.9866],
        [-0.9535, -0.8364, -0.9680, -0.5045,  0.9601,  0.7008],
        [ 0.7336,  0.2630, -0.2436,  0.8329,  0.9512,  0.4305],
        [ 0.9949,  0.6554,  0.9753,  0.7895, -0.9030, -0.2620],
        [ 0.8439, -0.3312,  0.9840,  0.0298, -0.8856, -0.9350],
        [ 0.9580, -0.1109,  0.6838,  0.5281, -0.9804, -0.8660],
        [ 0.9717, -0.0024, -0.9102,  0.5650, -0.9576, -0.3763],
        [-0.8796, -0.9556, -0.9727,  0.6911,  0.9892,  0.9061],
        [-0.9479, -0.6953, -0.9243,  0.0328,  0.8562, -0.2982],
        [ 0.9157,  0.5000, -0.9246,  0.2357,  0.9168,  0.1068],
        [ 0.9899,  0.4088,  0.8936,  0.4761, -0.7725,  0.5599],
        [ 0.9944, -0.4135,  0.9953,  0.1771, -0.8119,  0.7655],
        [ 0.9910,  0.2825,  0.9346,  0.5448, -0.7426, -0.9541],
        [ 0.7653, -0.5104, -0.5515,  0.2045, -0.9410, -0.9634],
        [-0.9902, -0.9331, -0.9668,  0.5190,  0.9238,  0.0876],
        [-0.8332, -0.9516, -0.9667, -0.5451,  0.9794,  0.8811],
        [ 0.7333,  0.6851, -0.9840, -0.5971,  0.5595,  0.3879],
        [ 0.9856, -0.0038,  0.9797,  0.6396, -0.9151, -0.3965],
        [ 0.9976, -0.0793,  0.9759,  0.0228, -0.8846, -0.6789]],
       device='cuda:0')
squash tensor([[ 2.1338e+00, -1.1025e+00, -1.7877e+00,  2.2414e-01, -2.7114e+00,
         -1.8737e+00],
        [-3.0420e+00, -2.0074e+00, -1.7293e+00,  2.2690e+00,  2.3590e+00,
          2.5008e+00],
        [-1.8688e+00, -1.2092e+00, -2.0592e+00, -5.5530e-01,  1.9475e+00,
          8.6892e-01],
        [ 9.3655e-01,  2.6932e-01, -2.4862e-01,  1.1977e+00,  1.8444e+00,
          4.6055e-01],
        [ 2.9863e+00,  7.8472e-01,  2.1910e+00,  1.0701e+00, -1.4882e+00,
         -2.6820e-01],
        [ 1.2346e+00, -3.4416e-01,  2.4115e+00,  2.9801e-02, -1.4011e+00,
         -1.6966e+00],
        [ 1.9209e+00, -1.1140e-01,  8.3617e-01,  5.8754e-01, -2.3067e+00,
         -1.3170e+00],
        [ 2.1215e+00, -2.4352e-03, -1.5288e+00,  6.4009e-01, -1.9156e+00,
         -3.9577e-01],
        [-1.3740e+00, -1.8924e+00, -2.1404e+00,  8.5005e-01,  2.6094e+00,
          1.5056e+00],
        [-1.8102e+00, -8.5815e-01, -1.6178e+00,  3.2837e-02,  1.2788e+00,
         -3.0758e-01],
        [ 1.5620e+00,  5.4937e-01, -1.6197e+00,  2.4024e-01,  1.5686e+00,
          1.0722e-01],
        [ 2.6440e+00,  4.3415e-01,  1.4397e+00,  5.1790e-01, -1.0265e+00,
          6.3271e-01],
        [ 2.9349e+00, -4.3983e-01,  3.0220e+00,  1.7894e-01, -1.1325e+00,
          1.0095e+00],
        [ 2.6984e+00,  2.9035e-01,  1.6938e+00,  6.1089e-01, -9.5615e-01,
         -1.8759e+00],
        [ 1.0090e+00, -5.6324e-01, -6.2058e-01,  2.0739e-01, -1.7471e+00,
         -1.9908e+00],
        [-2.6552e+00, -1.6816e+00, -2.0411e+00,  5.7503e-01,  1.6143e+00,
          8.7841e-02],
        [-1.1986e+00, -1.8482e+00, -2.0398e+00, -6.1139e-01,  2.2826e+00,
          1.3805e+00],
        [ 9.3572e-01,  8.3869e-01, -2.4106e+00, -6.8867e-01,  6.3205e-01,
          4.0936e-01],
        [ 2.4641e+00, -3.8030e-03,  2.2906e+00,  7.5741e-01, -1.5578e+00,
         -4.1950e-01],
        [ 3.3591e+00, -7.9424e-02,  2.2035e+00,  2.2851e-02, -1.3964e+00,
         -8.2701e-01]], device='cuda:0')
action: tensor([[ 0.9860, -0.3134,  0.9074,  0.6178, -0.9339, -0.8835],
        [ 0.8843, -0.8299, -0.6937,  0.7293, -0.9562, -0.9792],
        [-0.9924, -0.9818, -0.9033,  0.3653,  0.9623, -0.9278],
        [-0.8586, -0.9813, -0.9746, -0.8245,  0.9606,  0.4624],
        [ 0.2780,  0.6925, -0.9496, -0.6583, -0.7182,  0.6696],
        [ 0.9572,  0.4391,  0.9911,  0.4458, -0.8991, -0.3749],
        [ 0.9798,  0.4396,  0.9529,  0.4367, -0.8703, -0.9604],
        [ 0.9250,  0.2190, -0.2060,  0.8287, -0.9734, -0.8038],
        [-0.9912, -0.6748, -0.9922,  0.6802,  0.9753,  0.6457],
        [-0.8862, -0.9231, -0.9570, -0.3689,  0.9899,  0.4931],
        [ 0.9814,  0.2940, -0.8772, -0.2375,  0.3006,  0.0309],
        [ 0.9774, -0.4074,  0.9534,  0.4467, -0.2534,  0.4514],
        [ 0.9599, -0.0262,  0.9575, -0.2222, -0.8835, -0.8353],
        [ 0.9974,  0.7149,  0.9935,  0.2121, -0.9364, -0.9179],
        [ 0.9313, -0.0749, -0.2222,  0.6244, -0.9750, -0.8090],
        [-0.9939, -0.9176, -0.7916, -0.0743,  0.9863, -0.0265],
        [-0.9718, -0.6756, -0.9863, -0.2607,  0.9690,  0.3048],
        [ 0.9022,  0.3565, -0.6484, -0.5307,  0.7138,  0.3772],
        [ 0.9826, -0.0303,  0.9256,  0.3423, -0.8926, -0.4211],
        [ 0.9955, -0.4118,  0.9571,  0.7095, -0.9407, -0.8801]],
       device='cuda:0')
squash tensor([[ 2.4761, -0.3243,  1.5125,  0.7214, -1.6879, -1.3914],
        [ 1.3951, -1.1879, -0.8550,  0.9272, -1.8998, -2.2784],
        [-2.7828, -2.3457, -1.4898,  0.3830,  1.9755, -1.6421],
        [-1.2880, -2.3315, -2.1772, -1.1708,  1.9534,  0.5004],
        [ 0.2855,  0.8528, -1.8275, -0.7898, -0.9039,  0.8101],
        [ 1.9112,  0.4711,  2.7040,  0.4794, -1.4674, -0.3941],
        [ 2.2927,  0.4717,  1.8624,  0.4682, -1.3342, -1.9505],
        [ 1.6224,  0.2226, -0.2090,  1.1841, -2.1539, -1.1093],
        [-2.7082, -0.8195, -2.7734,  0.8294,  2.1905,  0.7679],
        [-1.4040, -1.6098, -1.9085, -0.3871,  2.6421,  0.5402],
        [ 2.3338,  0.3030, -1.3635, -0.2421,  0.3102,  0.0309],
        [ 2.2359, -0.4324,  1.8675,  0.4806, -0.2590,  0.4864],
        [ 1.9445, -0.0262,  1.9150, -0.2260, -1.3915, -1.2056],
        [ 3.3189,  0.8972,  2.8647,  0.2154, -1.7084, -1.5754],
        [ 1.6681, -0.0751, -0.2259,  0.7323, -2.1852, -1.1241],
        [-2.8941, -1.5735, -1.0758, -0.0744,  2.4887, -0.0265],
        [-2.1246, -0.8211, -2.4868, -0.2669,  2.0758,  0.3148],
        [ 1.4842,  0.3728, -0.7725, -0.5911,  0.8948,  0.3968],
        [ 2.3675, -0.0303,  1.6271,  0.3567, -1.4346, -0.4490],
        [ 3.0465, -0.4377,  1.9097,  0.8861, -1.7444, -1.3764]],
       device='cuda:0')
action: tensor([[ 0.9872,  0.2671,  0.6971,  0.2297, -0.9584, -0.9186],
        [ 0.9768,  0.3848, -0.9538,  0.2580, -0.9129,  0.0403],
        [-0.8907, -0.9432, -0.9237,  0.3496,  0.9976,  0.9603],
        [-0.9701, -0.9724, -0.9919, -0.0310,  0.9661,  0.5836],
        [ 0.8338, -0.2494, -0.2475,  0.3403,  0.5559,  0.9478],
        [ 0.8360, -0.1180,  0.9225,  0.7599, -0.5394,  0.4433],
        [-0.8828, -0.5684, -0.1242,  0.8341, -0.7302,  0.8535],
        [-0.9051,  0.8844, -0.7388, -0.3593, -0.5213,  0.7002],
        [ 0.7592,  0.2754, -0.8650, -0.8405, -0.3039, -0.0749],
        [ 0.9914, -0.7489,  0.9906, -0.9566, -0.9754, -0.9549],
        [ 0.9875, -0.9481, -0.9645,  0.9067, -0.9900, -0.9780],
        [-0.9889, -0.8735, -0.9495,  0.3385,  0.9938,  0.8228],
        [-0.9781, -0.9728, -0.9038, -0.5279,  0.9324,  0.9852],
        [ 0.9167,  0.5038, -0.3163,  0.4758,  0.9539,  0.2534],
        [ 0.9959,  0.6685,  0.9055,  0.9146, -0.9186, -0.8673],
        [ 0.9723,  0.7878,  0.8609,  0.6317, -0.9506, -0.5406],
        [ 0.9877, -0.0669, -0.7162,  0.9961, -0.9664,  0.2826],
        [-0.9963, -0.7543, -0.9606,  0.9878,  0.9939,  0.9783],
        [-0.9798, -0.9904, -0.9240, -0.2731,  0.9084,  0.8333],
        [ 0.1002,  0.6276, -0.6594, -0.9668,  0.2844,  0.8838]],
       device='cuda:0')
squash tensor([[ 2.5240,  0.2738,  0.8616,  0.2339, -1.9264, -1.5800],
        [ 2.2233,  0.4057, -1.8725,  0.2640, -1.5448,  0.0403],
        [-1.4252, -1.7659, -1.6139,  0.3650,  3.3641,  1.9494],
        [-2.0932, -2.1344, -2.7521, -0.0310,  2.0306,  0.6679],
        [ 1.2006, -0.2548, -0.2527,  0.3544,  0.6269,  1.8094],
        [ 1.2078, -0.1185,  1.6053,  0.9960, -0.6033,  0.4764],
        [-1.3883, -0.6451, -0.1249,  1.2016, -0.9291,  1.2691],
        [-1.4996,  1.3957, -0.9479, -0.3761, -0.5781,  0.8677],
        [ 0.9944,  0.2827, -1.3130, -1.2230, -0.3138, -0.0750],
        [ 2.7197, -0.9706,  2.6755, -1.9039, -2.1923, -1.8842],
        [ 2.5339, -1.8123, -2.0063,  1.5085, -2.6490, -2.2492],
        [-2.5953, -1.3479, -1.8268,  0.3524,  2.8886,  1.1653],
        [-2.2511, -2.1421, -1.4924, -0.5872,  1.6767,  2.4488],
        [ 1.5677,  0.5544, -0.3275,  0.5175,  1.8732,  0.2590],
        [ 3.0918,  0.8080,  1.5019,  1.5552, -1.5802, -1.3221],
        [ 2.1325,  1.0655,  1.2968,  0.7442, -1.8383, -0.6050],
        [ 2.5431, -0.0670, -0.8998,  3.1236, -2.0349,  0.2905],
        [-3.1457, -0.9828, -1.9531,  2.5470,  2.8912,  2.2564],
        [-2.2919, -2.6687, -1.6157, -0.2802,  1.5186,  1.1987],
        [ 0.1005,  0.7374, -0.7918, -2.0415,  0.2925,  1.3928]],
       device='cuda:0')
action: tensor([[ 9.9997e-01, -4.8733e-01, -9.0581e-01, -3.9506e-01, -9.9886e-01,
         -9.7581e-01],
        [-9.9468e-01, -7.0867e-01, -9.7118e-01,  9.3291e-01,  9.9481e-01,
          9.7100e-01],
        [-9.6622e-01, -9.9461e-01, -6.4314e-01, -2.1528e-01,  9.9588e-01,
          9.8666e-01],
        [-9.4260e-01, -5.0446e-01, -7.6014e-01,  8.1383e-01,  9.6373e-01,
          1.3054e-01],
        [ 8.9357e-01, -3.7639e-01,  9.2557e-01,  8.2331e-01,  6.6908e-01,
          6.6758e-01],
        [ 9.9817e-01, -5.8952e-01,  5.3556e-01,  4.1551e-01, -7.3182e-01,
          2.1806e-01],
        [ 9.5767e-01, -3.7939e-01,  9.5980e-01,  5.3037e-02, -9.0716e-01,
         -6.2038e-01],
        [ 9.8500e-01,  5.2728e-01,  7.3412e-01,  5.0203e-01, -8.5031e-01,
         -6.5896e-01],
        [ 9.5820e-01,  5.8357e-04, -4.2218e-01,  1.6823e-01, -8.6601e-01,
         -9.0251e-01],
        [-9.8935e-01, -9.5318e-01, -9.4076e-01,  7.7701e-02,  9.6547e-01,
          1.9701e-01],
        [-9.2956e-01, -9.8254e-01, -9.4248e-01, -6.4915e-01,  9.0619e-01,
          9.4258e-01],
        [ 9.7157e-01,  2.5627e-01, -1.2414e-02,  6.8727e-02,  3.7597e-01,
         -4.0794e-01],
        [ 9.9884e-01,  4.0542e-01,  9.8421e-01,  7.4603e-02, -9.3152e-01,
         -8.3145e-01],
        [ 9.9863e-01,  6.7962e-01,  9.8625e-01,  9.9531e-02, -9.5952e-01,
         -9.0818e-01],
        [ 9.9448e-01,  4.6007e-01, -8.5612e-01,  6.8247e-01, -8.9377e-01,
         -7.3242e-01],
        [-9.7474e-01, -8.6340e-01, -9.7018e-01,  6.7092e-01,  9.7345e-01,
          5.8209e-01],
        [-9.8378e-01, -9.7630e-01, -9.2000e-01, -1.4741e-01,  9.8751e-01,
          8.5762e-01],
        [ 9.3993e-01,  6.9630e-01, -9.4388e-01, -8.3295e-01,  5.7736e-01,
          1.6702e-01],
        [ 8.6106e-01, -5.1678e-01,  9.8413e-01,  4.0716e-01, -3.3039e-02,
          4.1443e-01],
        [ 6.6073e-01, -7.5742e-01,  9.0197e-01,  9.2395e-01, -5.5283e-01,
          4.6922e-02]], device='cuda:0')
squash tensor([[ 5.4863e+00, -5.3256e-01, -1.5037e+00, -4.1778e-01, -3.7365e+00,
         -2.2015e+00],
        [-2.9637e+00, -8.8451e-01, -2.1127e+00,  1.6804e+00,  2.9761e+00,
          2.1096e+00],
        [-2.0319e+00, -2.9567e+00, -7.6352e-01, -2.1870e-01,  3.0921e+00,
          2.5016e+00],
        [-1.7609e+00, -5.5528e-01, -9.9655e-01,  1.1383e+00,  1.9958e+00,
          1.3129e-01],
        [ 1.4394e+00, -3.9585e-01,  1.6266e+00,  1.1670e+00,  8.0907e-01,
          8.0636e-01],
        [ 3.4970e+00, -6.7693e-01,  5.9791e-01,  4.4226e-01, -9.3264e-01,
          2.2162e-01],
        [ 1.9170e+00, -3.9935e-01,  1.9433e+00,  5.3087e-02, -1.5112e+00,
         -7.2562e-01],
        [ 2.4426e+00,  5.8637e-01,  9.3761e-01,  5.5201e-01, -1.2573e+00,
         -7.9097e-01],
        [ 1.9235e+00,  5.8357e-04, -4.5034e-01,  1.6984e-01, -1.3169e+00,
         -1.4856e+00],
        [-2.6149e+00, -1.8655e+00, -1.7446e+00,  7.7858e-02,  2.0209e+00,
          1.9962e-01],
        [-1.6551e+00, -2.3662e+00, -1.7598e+00, -7.7382e-01,  1.5058e+00,
          1.7607e+00],
        [ 2.1195e+00,  2.6211e-01, -1.2415e-02,  6.8836e-02,  3.9536e-01,
         -4.3314e-01],
        [ 3.7266e+00,  4.3012e-01,  2.4169e+00,  7.4742e-02, -1.6697e+00,
         -1.1928e+00],
        [ 3.6434e+00,  8.2841e-01,  2.4863e+00,  9.9862e-02, -1.9399e+00,
         -1.5170e+00],
        [ 2.9448e+00,  4.9741e-01, -1.2786e+00,  8.3373e-01, -1.4403e+00,
         -9.3394e-01],
        [-2.1796e+00, -1.3065e+00, -2.0954e+00,  8.1241e-01,  2.1543e+00,
          6.6562e-01],
        [-2.4033e+00, -2.2118e+00, -1.5890e+00, -1.4849e-01,  2.5348e+00,
          1.2843e+00],
        [ 1.7375e+00,  8.6007e-01, -1.7725e+00, -1.1977e+00,  6.5850e-01,
          1.6860e-01],
        [ 1.2974e+00, -5.7193e-01,  2.4142e+00,  4.3220e-01, -3.3051e-02,
          4.4095e-01],
        [ 7.9410e-01, -9.9013e-01,  1.4827e+00,  1.6154e+00, -6.2245e-01,
          4.6956e-02]], device='cuda:0')
action: tensor([[ 0.9949,  0.0870,  0.9666,  0.6597, -0.2569, -0.1434],
        [ 0.9653,  0.0508,  0.9090,  0.3998, -0.5645, -0.2464],
        [ 0.9920,  0.4713,  0.3896,  0.7086, -0.9231, -0.9675],
        [-0.9629, -0.9790, -0.8872,  0.5153,  0.9708, -0.3766],
        [-0.9662, -0.9753, -0.9090, -0.3907,  0.9863,  0.8064],
        [ 0.8347,  0.6536, -0.8665, -0.7519,  0.1707, -0.5831],
        [ 0.9831, -0.7242,  0.9944, -0.2467, -0.7159,  0.5434],
        [ 0.9799, -0.3420,  0.9696,  0.0784, -0.6956, -0.9170],
        [ 0.9602, -0.6488, -0.8941,  0.9802, -0.8394, -0.9418],
        [-0.9940, -0.8633, -0.9234,  0.4420,  0.9792, -0.3202],
        [-0.9521, -0.9934, -0.8957, -0.5068,  0.9332,  0.5058],
        [ 0.4369,  0.6727, -0.8112, -0.5027,  0.4304, -0.0279],
        [ 0.9924, -0.0104,  0.9810, -0.0251, -0.6710,  0.5626],
        [ 0.9874,  0.0016,  0.9862, -0.1056, -0.9157, -0.2031],
        [ 0.9923,  0.7516,  0.5982,  0.4553, -0.5347, -0.6857],
        [ 0.9166, -0.2956, -0.5186,  0.2174, -0.9420, -0.9758],
        [-0.9964, -0.9577, -0.7725,  0.3983,  0.9203,  0.2160],
        [-0.9160, -0.9918, -0.9694, -0.7681,  0.9904,  0.7821],
        [ 0.7146,  0.4746, -0.4596, -0.2606,  0.6679,  0.5836],
        [ 0.9653, -0.0694,  0.9907,  0.1208, -0.9182, -0.8982]],
       device='cuda:0')
squash tensor([[ 2.9826e+00,  8.7243e-02,  2.0374e+00,  7.9235e-01, -2.6283e-01,
         -1.4438e-01],
        [ 2.0177e+00,  5.0829e-02,  1.5219e+00,  4.2336e-01, -6.3939e-01,
         -2.5157e-01],
        [ 2.7569e+00,  5.1168e-01,  4.1132e-01,  8.8444e-01, -1.6093e+00,
         -2.0515e+00],
        [-1.9838e+00, -2.2736e+00, -1.4086e+00,  5.6992e-01,  2.1064e+00,
         -3.9611e-01],
        [-2.0319e+00, -2.1903e+00, -1.5218e+00, -4.1263e-01,  2.4895e+00,
          1.1167e+00],
        [ 1.2035e+00,  7.8157e-01, -1.3188e+00, -9.7736e-01,  1.7243e-01,
         -6.6721e-01],
        [ 2.3836e+00, -9.1642e-01,  2.9338e+00, -2.5185e-01, -8.9927e-01,
          6.0898e-01],
        [ 2.2940e+00, -3.5630e-01,  2.0851e+00,  7.8608e-02, -8.5877e-01,
         -1.5698e+00],
        [ 1.9482e+00, -7.7322e-01, -1.4422e+00,  2.3030e+00, -1.2192e+00,
         -1.7535e+00],
        [-2.9010e+00, -1.3061e+00, -1.6113e+00,  4.7469e-01,  2.2789e+00,
         -3.3192e-01],
        [-1.8535e+00, -2.8530e+00, -1.4498e+00, -5.5845e-01,  1.6824e+00,
          5.5712e-01],
        [ 4.6842e-01,  8.1569e-01, -1.1305e+00, -5.5296e-01,  4.6036e-01,
         -2.7870e-02],
        [ 2.7867e+00, -1.0361e-02,  2.3234e+00, -2.5145e-02, -8.1248e-01,
          6.3669e-01],
        [ 2.5300e+00,  1.6097e-03,  2.4844e+00, -1.0601e-01, -1.5616e+00,
         -2.0591e-01],
        [ 2.7785e+00,  9.7669e-01,  6.9034e-01,  4.9140e-01, -5.9664e-01,
         -8.3983e-01],
        [ 1.5671e+00, -3.0467e-01, -5.7438e-01,  2.2096e-01, -1.7558e+00,
         -2.2015e+00],
        [-3.1618e+00, -1.9172e+00, -1.0266e+00,  4.2161e-01,  1.5908e+00,
          2.1944e-01],
        [-1.5634e+00, -2.7490e+00, -2.0820e+00, -1.0156e+00,  2.6695e+00,
          1.0508e+00],
        [ 8.9662e-01,  5.1601e-01, -4.9677e-01, -2.6671e-01,  8.0700e-01,
          6.6796e-01],
        [ 2.0182e+00, -6.9468e-02,  2.6818e+00,  1.2139e-01, -1.5772e+00,
         -1.4626e+00]], device='cuda:0')
action: tensor([[-0.9988,  0.9928, -0.9808, -0.9800, -0.9291,  0.1874],
        [ 0.3221,  0.9718, -0.9272, -0.8824, -0.5523,  0.4929],
        [ 0.9989, -0.6604,  0.9497, -0.9849, -0.9102, -0.8364],
        [ 0.9910,  0.8078, -0.9639,  0.1631, -0.9479, -0.7759],
        [-0.9939, -0.8773, -0.8435,  0.9220,  0.9859,  0.9912],
        [-0.9767, -0.9777, -0.9552, -0.7187,  0.9880,  0.8978],
        [ 0.9609,  0.2756, -0.7016,  0.7610,  0.9154,  0.8984],
        [ 0.9984, -0.5948,  0.9866,  0.6949, -0.9848, -0.2985],
        [ 0.9862,  0.0093,  0.9606,  0.9726, -0.9815, -0.6103],
        [ 0.6934, -0.9393, -0.9631,  0.9902, -0.7499, -0.4701],
        [-0.9111, -0.9632, -0.9905,  0.9957,  0.9894,  0.9798],
        [-0.9623, -0.9838, -0.9913, -0.4420,  0.8833,  0.4541],
        [ 0.4419,  0.9739, -0.9660, -0.9792, -0.5165,  0.8732],
        [ 0.9847,  0.9487,  0.9286,  0.6312, -0.2388,  0.2429],
        [-0.9737, -0.3313, -0.8785,  0.2304,  0.7569, -0.0949],
        [ 0.0376,  0.7690, -0.4785, -0.3574,  0.5491,  0.3647],
        [-0.5723,  0.4418, -0.6820, -0.4826, -0.4553,  0.6545],
        [-0.9941,  0.8180, -0.5699, -0.9706, -0.8919,  0.4037],
        [ 0.3975,  0.9167, -0.9699, -0.9263, -0.6205, -0.3889],
        [ 0.9855, -0.8764,  0.9944, -0.9839, -0.8136, -0.9791]],
       device='cuda:0')
squash tensor([[-3.7281,  2.8141, -2.3178, -2.2983, -1.6517,  0.1896],
        [ 0.3339,  2.1240, -1.6381, -1.3867, -0.6216,  0.5399],
        [ 3.7514, -0.7936,  1.8288, -2.4383, -1.5285, -1.2089],
        [ 2.6989,  1.1206, -1.9983,  0.1645, -1.8104, -1.0350],
        [-2.8958, -1.3637, -1.2333,  1.6023,  2.4743,  2.7089],
        [-2.2194, -2.2419, -1.8881, -0.9050,  2.5548,  1.4608],
        [ 1.9579,  0.2829, -0.8705,  0.9985,  1.5601,  1.4638],
        [ 3.5682, -0.6851,  2.4989,  0.8574, -2.4356, -0.3078],
        [ 2.4834,  0.0093,  1.9532,  2.1383, -2.3358, -0.7094],
        [ 0.8545, -1.7321, -1.9869,  2.6582, -0.9728, -0.5102],
        [-1.5342, -1.9882, -2.6720,  3.0703,  2.6169,  2.2937],
        [-1.9759, -2.4050, -2.7175, -0.4747,  1.3908,  0.4898],
        [ 0.4747,  2.1628, -2.0290, -2.2768, -0.5716,  1.3463],
        [ 2.4343,  1.8182,  1.6480,  0.7434, -0.2435,  0.2478],
        [-2.1584, -0.3443, -1.3691,  0.2346,  0.9889, -0.0951],
        [ 0.0376,  1.0179, -0.5210, -0.3739,  0.6171,  0.3823],
        [-0.6509,  0.4745, -0.8328, -0.5264, -0.4914,  0.7831],
        [-2.9125,  1.1509, -0.6473, -2.1031, -1.4311,  0.4281],
        [ 0.4207,  1.5682, -2.0905, -1.6319, -0.7259, -0.4105],
        [ 2.4614, -1.3600,  2.9355, -2.4080, -1.1375, -2.2750]],
       device='cuda:0')
action: tensor([[ 0.9078,  0.8599, -0.8881, -0.9590, -0.8144, -0.2991],
        [ 0.9648, -0.9764,  0.9876, -0.9313, -0.9618, -0.9859],
        [ 0.8999,  0.1491, -0.8888,  0.7739, -0.9641, -0.9631],
        [-0.9964, -0.9736, -0.9715,  0.6649,  0.9632,  0.9675],
        [-0.9637, -0.9917, -0.7220, -0.7997,  0.9725,  0.9804],
        [ 0.7637,  0.8753, -0.9023,  0.3370,  0.4067,  0.3721],
        [ 0.9913,  0.1205,  0.9836,  0.8036, -0.9792, -0.9195],
        [ 0.9828,  0.7671,  0.9317,  0.8160, -0.9742, -0.9347],
        [ 0.9141, -0.2590, -0.9951,  0.9605, -0.9667,  0.4254],
        [-0.9256, -0.9189, -0.9638,  0.9848,  0.9533,  0.9217],
        [-0.9516, -0.9719, -0.9470,  0.0948,  0.9438,  0.4510],
        [ 0.9758,  0.7894, -0.9802, -0.7381,  0.1290,  0.7734],
        [ 0.8708,  0.2134,  0.9702,  0.5116, -0.6634, -0.3018],
        [-0.8074, -0.3748,  0.4459,  0.7706,  0.2775,  0.3390],
        [-0.9626,  0.9898, -0.8980, -0.8053, -0.7286,  0.6618],
        [ 0.9192,  0.9163, -0.8646, -0.9878, -0.9338, -0.9357],
        [ 0.9211, -0.9522,  0.9398, -0.9257, -0.9409, -0.6811],
        [ 0.9870,  0.0449, -0.8581,  0.8939, -0.9761, -0.9417],
        [-0.9763, -0.7915, -0.9923,  0.8378,  0.9966,  0.9952],
        [-0.9648, -0.9937, -0.9588, -0.9389,  0.9523,  0.2855]],
       device='cuda:0')
squash tensor([[ 1.5151,  1.2929, -1.4130, -1.9339, -1.1401, -0.3085],
        [ 2.0109, -2.2149,  2.5393, -1.6680, -1.9693, -2.4754],
        [ 1.4719,  0.1502, -1.4162,  1.0299, -2.0010, -1.9870],
        [-3.1607, -2.1579, -2.1175,  0.8015,  1.9881,  2.0518],
        [-1.9953, -2.7417, -0.9119, -1.0977,  2.1365,  2.3069],
        [ 1.0051,  1.3554, -1.4843,  0.3507,  0.4316,  0.3908],
        [ 2.7143,  0.1211,  2.3981,  1.1087, -2.2779, -1.5858],
        [ 2.3732,  1.0133,  1.6711,  1.1449, -2.1682, -1.6941],
        [ 1.5520, -0.2650, -3.0039,  1.9521, -2.0388,  0.4543],
        [-1.6265, -1.5817, -1.9963,  2.4351,  1.8670,  1.6003],
        [-1.8481, -2.1264, -1.8017,  0.0951,  1.7716,  0.4860],
        [ 2.2003,  1.0698, -2.3022, -0.9462,  0.1298,  1.0288],
        [ 1.3366,  0.2167,  2.0958,  0.5649, -0.7989, -0.3115],
        [-1.1194, -0.3939,  0.4795,  1.0218,  0.2849,  0.3530],
        [-1.9800,  2.6345, -1.4619, -1.1135, -0.9257,  0.7960],
        [ 1.5840,  1.5656, -1.3113, -2.5464, -1.6875, -1.7022],
        [ 1.5963, -1.8549,  1.7367, -1.6278, -1.7459, -0.8313],
        [ 2.5139,  0.0449, -1.2860,  1.4412, -2.2075, -1.7524],
        [-2.2127, -1.0754, -2.7758,  1.2136,  3.1915,  3.0170],
        [-2.0106, -2.8799, -1.9311, -1.7289,  1.8562,  0.2937]],
       device='cuda:0')
action: tensor([[ 0.6810, -0.0171, -0.9520,  0.7537, -0.9479, -0.9529],
        [-0.9559, -0.9516, -0.8359,  0.3138,  0.9769,  0.4104],
        [-0.8898, -0.9942, -0.8767, -0.8643,  0.9776,  0.9763],
        [ 0.9588,  0.5513, -0.0370,  0.2264,  0.0160, -0.1879],
        [ 0.9581, -0.1403,  0.8859,  0.1970, -0.8837, -0.9703],
        [ 0.9876,  0.1372,  0.8501,  0.7631, -0.9194, -0.4167],
        [ 0.8996, -0.4897, -0.9634,  0.9623, -0.9679,  0.6309],
        [-0.9824, -0.9080, -0.9843,  0.9611,  0.9884,  0.9630],
        [-0.9823, -0.9704, -0.9841,  0.3193,  0.9058, -0.0085],
        [ 0.0236,  0.7980, -0.8107, -0.9600,  0.0235,  0.1746],
        [ 0.9978,  0.8734,  0.9551,  0.6069, -0.7105, -0.7395],
        [-0.9960,  0.8517, -0.9469, -0.3078,  0.6631,  0.8703],
        [ 0.7846,  0.9365, -0.9765, -0.8657, -0.4960,  0.3610],
        [ 0.9954, -0.7117,  0.9866, -0.9046, -0.6816, -0.6707],
        [ 0.9992,  0.7444, -0.1749, -0.5655, -0.9905, -0.8796],
        [ 0.6177, -0.1405, -0.2614,  0.3391, -0.8394, -0.4068],
        [-0.9955, -0.9345, -0.8534,  0.6252,  0.9425,  0.6110],
        [-0.9111, -0.9876, -0.9494, -0.6467,  0.9822,  0.9935],
        [ 0.3776,  0.8262, -0.6600, -0.0425,  0.6138, -0.0902],
        [ 0.9751, -0.3286,  0.9928,  0.4581, -0.9388, -0.7627]],
       device='cuda:0')
squash tensor([[ 0.8310, -0.0171, -1.8523,  0.9814, -1.8105, -1.8629],
        [-1.8958, -1.8488, -1.2074,  0.3248,  2.2249,  0.4361],
        [-1.4212, -2.9231, -1.3611, -1.3103,  2.2399,  2.2115],
        [ 1.9308,  0.6203, -0.0370,  0.2304,  0.0160, -0.1901],
        [ 1.9218, -0.1413,  1.4024,  0.1996, -1.3923, -2.0974],
        [ 2.5398,  0.1381,  1.2564,  1.0035, -1.5852, -0.4437],
        [ 1.4702, -0.5356, -1.9913,  1.9764, -2.0573,  0.7429],
        [-2.3634, -1.5159, -2.4184,  1.9596,  2.5730,  1.9863],
        [-2.3598, -2.0994, -2.4143,  0.3309,  1.5036, -0.0085],
        [ 0.0236,  1.0932, -1.1290, -1.9456,  0.0235,  0.1764],
        [ 3.3981,  1.3472,  1.8872,  0.7040, -0.8883, -0.9493],
        [-3.1071,  1.2624, -1.8012, -0.3181,  0.7983,  1.3341],
        [ 1.0572,  1.7088, -2.2157, -1.3155, -0.5440,  0.3781],
        [ 3.0357, -0.8906,  2.5003, -1.4969, -0.8322, -0.8121],
        [ 3.8984,  0.9603, -0.1767, -0.6409, -2.6705, -1.3739],
        [ 0.7213, -0.1414, -0.2676,  0.3531, -1.2192, -0.4318],
        [-3.0495, -1.6929, -1.2684,  0.7335,  1.7602,  0.7104],
        [-1.5339, -2.5365, -1.8256, -0.7696,  2.3554,  2.8609],
        [ 0.3972,  1.1760, -0.7927, -0.0425,  0.7150, -0.0905],
        [ 2.1876, -0.3413,  2.8148,  0.4949, -1.7279, -1.0027]],
       device='cuda:0')
action: tensor([[ 0.2842,  0.7928, -0.9780, -0.9897, -0.6012, -0.7849],
        [ 0.9965, -0.8497,  0.9939, -0.9550, -0.9494, -0.7216],
        [ 0.9898,  0.6872, -0.9382,  0.3792, -0.9477, -0.9172],
        [-0.9964, -0.9431, -0.9848,  0.8392,  0.9481,  0.9874],
        [-0.9394, -0.9677, -0.8800, -0.8768,  0.9959,  0.8249],
        [ 0.6714,  0.6313, -0.4903,  0.6353,  0.6384,  0.2024],
        [ 0.9962, -0.1936,  0.9872,  0.6318, -0.9693, -0.5002],
        [ 0.9594,  0.7305,  0.8071, -0.1289, -0.9611, -0.9793],
        [ 0.9846,  0.1690, -0.2303,  0.8466, -0.9585, -0.1411],
        [-0.9767, -0.7889, -0.9909,  0.9242,  0.9752,  0.9588],
        [-0.8960, -0.9846, -0.9311, -0.2636,  0.9754,  0.9623],
        [ 0.5318, -0.5521, -0.7580, -0.1788,  0.2952,  0.8946],
        [ 0.9678,  0.6646,  0.9218,  0.5444, -0.5181,  0.3258],
        [-0.9794,  0.7568, -0.9687, -0.9806, -0.1230, -0.0717],
        [ 0.7138,  0.9061, -0.9407, -0.9592, -0.0289,  0.1946],
        [ 0.9939, -0.5450,  0.9360, -0.9289, -0.9742, -0.9594],
        [ 0.9994,  0.0932,  0.0599, -0.3732, -0.9666, -0.7135],
        [-0.8744,  0.0907, -0.9726,  0.7503,  0.9760,  0.9844],
        [-0.9682, -0.9951, -0.9896, -0.1302,  0.9589,  0.9566],
        [-0.6563, -0.0797, -0.8988,  0.4459,  0.7239, -0.1251]],
       device='cuda:0')
squash tensor([[ 0.2922,  1.0788, -2.2488, -2.6324, -0.6950, -1.0581],
        [ 3.1772, -1.2549,  2.8926, -1.8859, -1.8253, -0.9109],
        [ 2.6366,  0.8427, -1.7224,  0.3991, -1.8089, -1.5713],
        [-3.1538, -1.7654, -2.4373,  1.2184,  1.8124,  2.5286],
        [-1.7326, -2.0554, -1.3756, -1.3618,  3.0942,  1.1718],
        [ 0.8133,  0.7436, -0.5365,  0.7503,  0.7555,  0.2053],
        [ 3.1287, -0.1960,  2.5235,  0.7444, -2.0800, -0.5496],
        [ 1.9382,  0.9298,  1.1187, -0.1296, -1.9605, -2.2805],
        [ 2.4288,  0.1706, -0.2345,  1.2439, -1.9269, -0.1420],
        [-2.2202, -1.0686, -2.6946,  1.6174,  2.1896,  1.9304],
        [-1.4517, -2.4294, -1.6662, -0.2700,  2.1929,  1.9763],
        [ 0.5926, -0.6215, -0.9915, -0.1808,  0.3043,  1.4446],
        [ 2.0561,  0.8010,  1.6010,  0.6104, -0.5738,  0.3382],
        [-2.2823,  0.9886, -2.0712, -2.3133, -0.1237, -0.0718],
        [ 0.8950,  1.5056, -1.7440, -1.9354, -0.0289,  0.1971],
        [ 2.8952, -0.6113,  1.7046, -1.6503, -2.1690, -1.9387],
        [ 4.0279,  0.0934,  0.0600, -0.3922, -2.0376, -0.8944],
        [-1.3517,  0.0909, -2.1384,  0.9735,  2.2050,  2.4225],
        [-2.0635, -3.0004, -2.6269, -0.1309,  1.9319,  1.9037],
        [-0.7863, -0.0799, -1.4658,  0.4796,  0.9157, -0.1257]],
       device='cuda:0')
action: tensor([[ 0.9961,  0.9116,  0.9607,  0.0306, -0.9189, -0.9575],
        [ 0.9927, -0.1300, -0.7421, -0.1952, -0.2629, -0.9250],
        [-0.9925, -0.9309, -0.9586,  0.0794,  0.9766,  0.4124],
        [-0.4189, -0.9939, -0.9702, -0.7459,  0.9849,  0.9087],
        [ 0.6095,  0.0177, -0.1936, -0.0151,  0.8714,  0.7243],
        [ 0.9658,  0.6756,  0.9475, -0.0313, -0.6083,  0.4415],
        [ 0.9903, -0.6276,  0.9465,  0.3824, -0.5891, -0.7688],
        [ 0.9872, -0.3905,  0.9259,  0.7754, -0.7769, -0.8466],
        [ 0.7501, -0.6940, -0.7388,  0.3289, -0.9180, -0.9707],
        [-0.9907, -0.9763, -0.9625,  0.4839,  0.9830, -0.5241],
        [-0.9723, -0.9965, -0.9613, -0.6698,  0.9809,  0.8917],
        [ 0.1962,  0.8331, -0.9826, -0.7959,  0.1763,  0.5076],
        [ 0.9297,  0.0491,  0.9883,  0.2232, -0.8230, -0.2154],
        [ 0.9392,  0.3103,  0.9357, -0.4889, -0.3303, -0.8283],
        [ 0.9615,  0.2428,  0.5299,  0.3912, -0.9735, -0.9280],
        [ 0.9467,  0.3216, -0.9786,  0.1053, -0.9099, -0.8982],
        [-0.9776, -0.9156, -0.9765,  0.2152,  0.9664, -0.0901],
        [-0.9833, -0.9923, -0.9839, -0.8178,  0.9725,  0.6129],
        [ 0.8793, -0.1522,  0.4892,  0.0509,  0.8400,  0.9117],
        [ 0.9823,  0.6772,  0.7635, -0.0270, -0.9945, -0.8954]],
       device='cuda:0')
squash tensor([[ 3.1201,  1.5370,  1.9554,  0.0306, -1.5820, -1.9154],
        [ 2.8079, -0.1307, -0.9552, -0.1978, -0.2692, -1.6226],
        [-2.7929, -1.6652, -1.9278,  0.0796,  2.2192,  0.4384],
        [-0.4463, -2.8961, -2.0951, -0.9636,  2.4398,  1.5199],
        [ 0.7081,  0.0177, -0.1961, -0.0151,  1.3388,  0.9166],
        [ 2.0250,  0.8209,  1.8065, -0.0313, -0.7062,  0.4741],
        [ 2.6642, -0.7375,  1.7968,  0.4029, -0.6763, -1.0173],
        [ 2.5222, -0.4124,  1.6291,  1.0337, -1.0374, -1.2439],
        [ 0.9733, -0.8556, -0.9479,  0.3416, -1.5760, -2.1035],
        [-2.6825, -2.2113, -1.9786,  0.5281,  2.3786, -0.5820],
        [-2.1328, -3.1685, -1.9629, -0.8103,  2.3215,  1.4300],
        [ 0.1988,  1.1983, -2.3692, -1.0874,  0.1782,  0.5595],
        [ 1.6560,  0.0491,  2.5667,  0.2271, -1.1661, -0.2188],
        [ 1.7312,  0.3208,  1.7025, -0.5346, -0.3431, -1.1827],
        [ 1.9655,  0.2477,  0.5900,  0.4132, -2.1543, -1.6435],
        [ 1.7988,  0.3334, -2.2642,  0.1057, -1.5267, -1.4628],
        [-2.2396, -1.5611, -2.2164,  0.2187,  2.0347, -0.0903],
        [-2.3879, -2.7782, -2.4083, -1.1500,  2.1372,  0.7136],
        [ 1.3727, -0.1533,  0.5349,  0.0509,  1.2211,  1.5372],
        [ 2.3591,  0.8240,  1.0046, -0.0270, -2.9453, -1.4486]],
       device='cuda:0')
action: tensor([[ 0.9528,  0.6446,  0.9799,  0.6128, -0.9150, -0.9340],
        [ 0.9251, -0.2405, -0.9489,  0.4410, -0.9931, -0.5866],
        [-0.9699, -0.9776, -0.8882,  0.0506,  0.9856,  0.1894],
        [-0.9861, -0.9283, -0.9689, -0.1923,  0.9776,  0.9174],
        [ 0.9450,  0.3161, -0.9337, -0.6860,  0.4452, -0.3674],
        [ 0.9862,  0.3198,  0.9761,  0.5269, -0.6317, -0.7769],
        [ 0.9933,  0.0633,  0.9884,  0.7662, -0.7835, -0.8585],
        [ 0.9408, -0.2747, -0.1028,  0.6861, -0.9774, -0.9155],
        [-0.9953, -0.9906, -0.8871,  0.7326,  0.8023, -0.4691],
        [-0.9716, -0.9836, -0.9632, -0.4256,  0.9774,  0.6731],
        [ 0.9649,  0.4913, -0.9105, -0.6769,  0.2881,  0.1442],
        [ 0.9897, -0.6807,  0.9391, -0.0201, -0.8692, -0.5077],
        [ 0.9721,  0.5983,  0.9437, -0.4200, -0.5826,  0.5038],
        [ 0.9987,  0.2000,  0.1287,  0.2292, -0.9691, -0.5371],
        [ 0.8853, -0.0465, -0.8535,  0.3866, -0.9723, -0.8614],
        [-0.9780, -0.9626, -0.7950,  0.0045,  0.9975,  0.4355],
        [-0.9940, -0.9756, -0.9427, -0.1429,  0.9783,  0.9979],
        [ 0.7583, -0.1504, -0.7338,  0.3276,  0.8731,  0.5691],
        [ 0.9871, -0.3928,  0.9960,  0.2933, -0.8912,  0.3888],
        [ 0.9348, -0.2742,  0.9950, -0.7037, -0.8038, -0.8435]],
       device='cuda:0')
squash tensor([[ 1.8614,  0.7660,  2.2947,  0.7134, -1.5573, -1.6892],
        [ 1.6234, -0.2453, -1.8203,  0.4735, -2.8316, -0.6725],
        [-2.0899, -2.2401, -1.4135,  0.0506,  2.4649,  0.1917],
        [-2.4807, -1.6461, -2.0735, -0.1947,  2.2406,  1.5726],
        [ 1.7830,  0.3274, -1.6863, -0.8404,  0.4787, -0.3854],
        [ 2.4832,  0.3315,  2.2077,  0.5858, -0.7442, -1.0375],
        [ 2.8498,  0.0634,  2.5733,  1.0112, -1.0544, -1.2875],
        [ 1.7454, -0.2820, -0.1031,  0.8406, -2.2362, -1.5608],
        [-3.0285, -2.6777, -1.4079,  0.9343,  1.1050, -0.5089],
        [-2.1201, -2.3974, -1.9883, -0.4545,  2.2362,  0.8163],
        [ 2.0125,  0.5378, -1.5302, -0.8234,  0.2965,  0.1452],
        [ 2.6323, -0.8305,  1.7302, -0.0201, -1.3299, -0.5597],
        [ 2.1297,  0.6905,  1.7704, -0.4477, -0.6663,  0.5544],
        [ 3.6717,  0.2027,  0.1294,  0.2333, -2.0771, -0.6000],
        [ 1.3998, -0.0465, -1.2691,  0.4077, -2.1334, -1.2987],
        [-2.2494, -1.9807, -1.0848,  0.0045,  3.3332,  0.4666],
        [-2.9033, -2.1963, -1.7618, -0.1439,  2.2554,  3.4212],
        [ 0.9921, -0.1515, -0.9370,  0.3402,  1.3458,  0.6462],
        [ 2.5168, -0.4151,  3.1082,  0.3022, -1.4277,  0.4104],
        [ 1.6954, -0.2814,  2.9909, -0.8746, -1.1091, -1.2331]],
       device='cuda:0')
action: tensor([[-0.9888, -0.9971, -0.9171, -0.3249,  0.9865,  0.2709],
        [-0.9488, -0.9838, -0.9300, -0.9005,  0.9901,  0.9032],
        [ 0.9612,  0.1317,  0.0485, -0.0053,  0.8936,  0.8050],
        [ 0.9636, -0.2619,  0.9934, -0.1199, -0.8135, -0.6069],
        [ 0.9950,  0.0788,  0.9942,  0.6826, -0.9496, -0.9285],
        [ 0.9277, -0.0653, -0.9209,  0.9788, -0.9043, -0.1043],
        [-0.9888, -0.9800, -0.9773,  0.8693,  0.9660,  0.8021],
        [-0.9542, -0.9899, -0.9716, -0.1417,  0.9593,  0.8871],
        [ 0.9136,  0.9156, -0.9604, -0.0689,  0.1967, -0.7428],
        [ 0.9185, -0.3807,  0.9937, -0.0868, -0.7827, -0.6397],
        [ 0.9710, -0.1799,  0.9964, -0.1653, -0.5846, -0.7532],
        [ 0.9735,  0.1773, -0.2741,  0.7812, -0.9669, -0.4811],
        [ 0.7262,  0.0952, -0.8961, -0.1040, -0.7110, -0.8998],
        [-0.9886, -0.9910, -0.9749,  0.5029,  0.7373,  0.5282],
        [-0.9264, -0.8706, -0.9894, -0.9188,  0.9428,  0.8054],
        [ 0.6418,  0.6560, -0.5483,  0.0964,  0.3230,  0.3867],
        [ 0.9753, -0.0420,  0.9915,  0.6125, -0.8835, -0.8154],
        [ 0.9622,  0.0381,  0.9876,  0.4735, -0.9301, -0.7563],
        [ 0.9586,  0.4564, -0.7931,  0.9495, -0.9895, -0.4578],
        [-0.9824, -0.9842, -0.9905,  0.9105,  0.9844,  0.9814]],
       device='cuda:0')
squash tensor([[-2.5917, -3.2592, -1.5707, -0.3371,  2.4943,  0.2779],
        [-1.8192, -2.4043, -1.6584, -1.4747,  2.6499,  1.4891],
        [ 1.9609,  0.1325,  0.0485, -0.0053,  1.4398,  1.1128],
        [ 1.9944, -0.2681,  2.8522, -0.1205, -1.1374, -0.7039],
        [ 2.9988,  0.0790,  2.9194,  0.8340, -1.8275, -1.6472],
        [ 1.6417, -0.0654, -1.5952,  2.2684, -1.4953, -0.1047],
        [-2.5901, -2.2985, -2.2333,  1.3303,  2.0292,  1.1045],
        [-1.8768, -2.6403, -2.1204, -0.1427,  1.9368,  1.4080],
        [ 1.5489,  1.5612, -1.9515, -0.0690,  0.1993, -0.9568],
        [ 1.5796, -0.4009,  2.8812, -0.0870, -1.0523, -0.7576],
        [ 2.1098, -0.1819,  3.1641, -0.1668, -0.6695, -0.9803],
        [ 2.1560,  0.1792, -0.2812,  1.0484, -2.0424, -0.5244],
        [ 0.9206,  0.0954, -1.4523, -0.1044, -0.8893, -1.4714],
        [-2.5805, -2.6984, -2.1827,  0.5532,  0.9446,  0.5876],
        [-1.6322, -1.3357, -2.6186, -1.5815,  1.7626,  1.1137],
        [ 0.7612,  0.7857, -0.6160,  0.0967,  0.3350,  0.4079],
        [ 2.1904, -0.0420,  2.7293,  0.7129, -1.3915, -1.1430],
        [ 1.9747,  0.0381,  2.5396,  0.5146, -1.6594, -0.9875],
        [ 1.9277,  0.4927, -1.0796,  1.8267, -2.6243, -0.4945],
        [-2.3616, -2.4157, -2.6735,  1.5306,  2.4218,  2.3340]],
       device='cuda:0')
action: tensor([[ 0.4660,  0.7466, -0.9798, -0.5543, -0.0167,  0.9535],
        [ 0.9809,  0.7959,  0.9393,  0.4274, -0.9492,  0.1612],
        [ 0.9339,  0.2129,  0.9589,  0.7217, -0.8196,  0.5513],
        [ 0.9584, -0.4680, -0.9471,  0.7982, -0.9133, -0.8836],
        [-0.9787, -0.9343, -0.9714,  0.6177,  0.9704, -0.5443],
        [-0.8804, -0.9719, -0.9341, -0.9779,  0.8161, -0.8463],
        [-0.2007,  0.4271, -0.8515, -0.9570,  0.8723,  0.8962],
        [ 0.9915, -0.3275,  0.9926, -0.0396, -0.8967, -0.8351],
        [ 0.9813, -0.1035,  0.9634,  0.6920, -0.8888, -0.7804],
        [ 0.5647, -0.8874, -0.9533,  0.9657, -0.5941, -0.5122],
        [-0.9905, -0.9844, -0.9160,  0.8796,  0.9383,  0.8221],
        [-0.8077, -0.9131, -0.9123, -0.5811,  0.6543,  0.5080],
        [ 0.1604,  0.8330, -0.9850, -0.4788,  0.5801,  0.0153],
        [ 0.9854,  0.4839,  0.9749,  0.4958, -0.8719, -0.0643],
        [ 0.9843,  0.1353,  0.9561,  0.3771, -0.9229, -0.9082],
        [ 0.9269,  0.7625,  0.8141,  0.3511, -0.9043, -0.1322],
        [ 0.8435,  0.0360, -0.9079,  0.5873, -0.9167, -0.8743],
        [-0.8957, -0.9775, -0.8425,  0.3687,  0.9385,  0.2921],
        [-0.9773, -0.9717, -0.8194, -0.8211,  0.9826,  0.8803],
        [ 0.0530,  0.7925, -0.8325,  0.1805,  0.3407,  0.7232]],
       device='cuda:0')
squash tensor([[ 0.5050,  0.9651, -2.2925, -0.6246, -0.0167,  1.8692],
        [ 2.3214,  1.0874,  1.7317,  0.4567, -1.8241,  0.1626],
        [ 1.6882,  0.2162,  1.9326,  0.9113, -1.1555,  0.6202],
        [ 1.9261, -0.5075, -1.8031,  1.0937, -1.5468, -1.3918],
        [-2.2665, -1.6911, -2.1170,  0.7213,  2.0989, -0.6102],
        [-1.3777, -2.1252, -1.6896, -2.2469,  1.1451, -1.2429],
        [-0.2034,  0.4564, -1.2618, -1.9095,  1.3427,  1.4526],
        [ 2.7290, -0.3400,  2.8010, -0.0396, -1.4552, -1.2047],
        [ 2.3307, -0.1038,  1.9915,  0.8517, -1.4161, -1.0464],
        [ 0.6398, -1.4096, -1.8667,  2.0239, -0.6840, -0.5657],
        [-2.6723, -2.4238, -1.5633,  1.3738,  1.7237,  1.1631],
        [-1.1205, -1.5456, -1.5413, -0.6641,  0.7827,  0.5601],
        [ 0.1618,  1.1978, -2.4428, -0.5214,  0.6626,  0.0153],
        [ 2.4573,  0.5280,  2.1821,  0.5437, -1.3411, -0.0644],
        [ 2.4203,  0.1362,  1.8989,  0.3967, -1.6081, -1.5170],
        [ 1.6357,  1.0021,  1.1392,  0.3667, -1.4954, -0.1330],
        [ 1.2333,  0.0361, -1.5154,  0.6736, -1.5678, -1.3509],
        [-1.4501, -2.2379, -1.2298,  0.3869,  1.7255,  0.3009],
        [-2.2332, -2.1211, -1.1550, -1.1602,  2.3687,  1.3770],
        [ 0.0531,  1.0782, -1.1963,  0.1825,  0.3549,  0.9143]],
       device='cuda:0')
action: tensor([[-0.7832, -0.9857, -0.9610, -0.7244,  0.9654,  0.7816],
        [ 0.8646,  0.3287, -0.2594, -0.0861,  0.8310,  0.5343],
        [ 0.9656, -0.0413,  0.9940,  0.4036, -0.9251, -0.8201],
        [ 0.9745,  0.2944,  0.9937, -0.5327, -0.9902, -0.7676],
        [ 0.9377,  0.7403,  0.2259,  0.4832, -0.4470, -0.6947],
        [-0.9636, -0.8464, -0.9033,  0.6419,  0.9853,  0.9264],
        [-0.9951, -0.9910, -0.9431, -0.2805,  0.9974,  0.7777],
        [ 0.7575, -0.1825,  0.3426, -0.0292,  0.3416,  0.6926],
        [ 0.9741,  0.9851,  0.8017, -0.3707, -0.9353,  0.2806],
        [-0.9873,  0.3502, -0.7404,  0.5818,  0.3020,  0.0069],
        [-0.9049,  0.6331, -0.6587, -0.6237,  0.2651,  0.4350],
        [-0.7712,  0.7298, -0.9721, -0.8729, -0.8312,  0.4964],
        [ 0.1977,  0.7332, -0.8179, -0.9904, -0.4215, -0.8885],
        [ 0.9839, -0.9654,  0.9294, -0.8739, -0.9656, -0.9022],
        [ 0.9928,  0.2260, -0.7484,  0.6847, -0.9963, -0.8921],
        [-0.9625, -0.9393, -0.9845,  0.7809,  0.9821,  0.9935],
        [-0.9711, -0.9836, -0.9576, -0.8486,  0.9088,  0.7342],
        [ 0.7087,  0.9837, -0.7930,  0.3121,  0.4600,  0.6898],
        [ 0.9897,  0.3707,  0.9657,  0.4059, -0.7382, -0.9358],
        [ 0.9584,  0.8129,  0.9708,  0.7557, -0.9590, -0.8469]],
       device='cuda:0')
squash tensor([[-1.0535, -2.4659, -1.9587, -0.9169,  2.0203,  1.0496],
        [ 1.3112,  0.3414, -0.2654, -0.0864,  1.1914,  0.5961],
        [ 2.0221, -0.0413,  2.9053,  0.4280, -1.6230, -1.1572],
        [ 2.1745,  0.3033,  2.8815, -0.5939, -2.6575, -1.0145],
        [ 1.7190,  0.9511,  0.2299,  0.5271, -0.4810, -0.8570],
        [-1.9944, -1.2435, -1.4897,  0.7615,  2.4531,  1.6323],
        [-3.0030, -2.7014, -1.7655, -0.2882,  3.3269,  1.0394],
        [ 0.9903, -0.1845,  0.3571, -0.0292,  0.3559,  0.8530],
        [ 2.1665,  2.4465,  1.1032, -0.3892, -1.6994,  0.2883],
        [-2.5279,  0.3657, -0.9513,  0.6652,  0.3117,  0.0069],
        [-1.4985,  0.7466, -0.7905, -0.7311,  0.2716,  0.4661],
        [-1.0233,  0.9284, -2.1283, -1.3452, -1.1919,  0.5445],
        [ 0.2004,  0.9356, -1.1504, -2.6691, -0.4496, -1.4149],
        [ 2.4057, -2.0194,  1.6541, -1.3493, -2.0226, -1.4838],
        [ 2.8092,  0.2300, -0.9694,  0.8379, -3.1498, -1.4319],
        [-1.9791, -1.7323, -2.4255,  1.0478,  2.3530,  2.8647],
        [-2.1118, -2.3975, -1.9159, -1.2510,  1.5207,  0.9379],
        [ 0.8846,  2.3997, -1.0795,  0.3228,  0.4973,  0.8476],
        [ 2.6296,  0.3892,  2.0240,  0.4306, -0.9465, -1.7031],
        [ 1.9256,  1.1356,  2.1067,  0.9861, -1.9335, -1.2452]],
       device='cuda:0')
action: tensor([[ 0.9023,  0.7043, -0.9525, -0.7858,  0.2386,  0.3090],
        [ 0.9394, -0.2969,  0.9563,  0.3852, -0.9452, -0.8569],
        [ 0.9754, -0.1608,  0.8916,  0.6729, -0.8983, -0.7388],
        [ 0.9631, -0.4012, -0.6490,  0.9619, -0.8711, -0.5588],
        [-0.9876, -0.9920, -0.9523,  0.5933,  0.9395,  0.0848],
        [-0.9809, -0.9884, -0.9765, -0.2216,  0.9227,  0.7777],
        [ 0.1681,  0.9012, -0.7821, -0.8588,  0.3685, -0.3331],
        [ 0.9914,  0.2243,  0.9248,  0.5726, -0.6070, -0.0416],
        [ 0.9923,  0.5543,  0.9926,  0.3369, -0.5893, -0.3628],
        [ 0.9832,  0.0386,  0.4552,  0.0030, -0.7424, -0.8236],
        [ 0.9611, -0.4529, -0.8647,  0.5931, -0.9273, -0.9896],
        [-0.9937, -0.9775, -0.8795, -0.1140,  0.9781, -0.9373],
        [-0.9821, -0.9814, -0.8714, -0.5052,  0.9648,  0.8867],
        [ 0.3820,  0.9705, -0.9640, -0.9711,  0.0345,  0.6815],
        [ 0.9935,  0.1124,  0.9837,  0.1699, -0.7746, -0.0185],
        [ 0.9517,  0.0939,  0.9947,  0.1701, -0.7895, -0.7157],
        [ 0.9572,  0.1427,  0.7533,  0.5962, -0.9128, -0.8008],
        [-0.9247, -0.9685, -0.9957,  0.4705,  0.8518, -0.3742],
        [-0.9375, -0.9527, -0.9871, -0.2666,  0.8208,  0.8781],
        [ 0.7459,  0.7054, -0.8833, -0.8520,  0.5847,  0.8908]],
       device='cuda:0')
squash tensor([[ 1.4845e+00,  8.7586e-01, -1.8577e+00, -1.0605e+00,  2.4331e-01,
          3.1947e-01],
        [ 1.7332e+00, -3.0617e-01,  1.9008e+00,  4.0613e-01, -1.7850e+00,
         -1.2815e+00],
        [ 2.1936e+00, -1.6222e-01,  1.4295e+00,  8.1594e-01, -1.4635e+00,
         -9.4788e-01],
        [ 1.9865e+00, -4.2508e-01, -7.7358e-01,  1.9703e+00, -1.3377e+00,
         -6.3110e-01],
        [-2.5373e+00, -2.7580e+00, -1.8559e+00,  6.8277e-01,  1.7340e+00,
          8.5022e-02],
        [-2.3197e+00, -2.5723e+00, -2.2164e+00, -2.2530e-01,  1.6069e+00,
          1.0394e+00],
        [ 1.6973e-01,  1.4788e+00, -1.0508e+00, -1.2886e+00,  3.8667e-01,
         -3.4628e-01],
        [ 2.7212e+00,  2.2817e-01,  1.6209e+00,  6.5137e-01, -7.0419e-01,
         -4.1587e-02],
        [ 2.7801e+00,  6.2461e-01,  2.7959e+00,  3.5056e-01, -6.7664e-01,
         -3.8014e-01],
        [ 2.3850e+00,  3.8599e-02,  4.9120e-01,  2.9700e-03, -9.5587e-01,
         -1.1678e+00],
        [ 1.9607e+00, -4.8837e-01, -1.3119e+00,  6.8246e-01, -1.6386e+00,
         -2.6263e+00],
        [-2.8749e+00, -2.2370e+00, -1.3734e+00, -1.1450e-01,  2.2515e+00,
         -1.7154e+00],
        [-2.3547e+00, -2.3344e+00, -1.3390e+00, -5.5623e-01,  2.0114e+00,
          1.4064e+00],
        [ 4.0239e-01,  2.1005e+00, -1.9994e+00, -2.1104e+00,  3.4559e-02,
          8.3198e-01],
        [ 2.8625e+00,  1.1290e-01,  2.4021e+00,  1.7160e-01, -1.0318e+00,
         -1.8543e-02],
        [ 1.8496e+00,  9.4190e-02,  2.9615e+00,  1.7177e-01, -1.0700e+00,
         -8.9886e-01],
        [ 1.9118e+00,  1.4371e-01,  9.8053e-01,  6.8717e-01, -1.5439e+00,
         -1.1008e+00],
        [-1.6206e+00, -2.0669e+00, -3.0655e+00,  5.1066e-01,  1.2628e+00,
         -3.9328e-01],
        [-1.7174e+00, -1.8606e+00, -2.5192e+00, -2.7325e-01,  1.1592e+00,
          1.3675e+00],
        [ 9.6360e-01,  8.7792e-01, -1.3908e+00, -1.2633e+00,  6.6965e-01,
          1.4257e+00]], device='cuda:0')
action: tensor([[-0.9433, -0.9333, -0.9705,  0.3386,  0.8355,  0.7675],
        [-0.9455, -0.9504, -0.9484, -0.6474,  0.9897,  0.9675],
        [ 0.8883,  0.4367,  0.1996,  0.6406,  0.6152,  0.5010],
        [ 0.9703,  0.5735,  0.9099,  0.1609, -0.9959, -0.9438],
        [ 0.9558,  0.6451,  0.9790,  0.0554, -0.9835, -0.9170],
        [ 0.9891,  0.6902, -0.6736,  0.5254, -0.9424, -0.6417],
        [-0.9991, -0.7740, -0.9858,  0.7043,  0.9846,  0.9671],
        [-0.8376, -0.9851, -0.9288, -0.1808,  0.9551,  0.8929],
        [ 0.8266,  0.0411, -0.8359, -0.7292,  0.8788,  0.6091],
        [ 0.9855, -0.1606,  0.9963,  0.9075,  0.2690,  0.9565],
        [ 0.3306, -0.5318,  0.5386,  0.1734, -0.1214,  0.3173],
        [ 0.9350,  0.7174,  0.9898, -0.1613, -0.1881, -0.4264],
        [ 0.8778, -0.0410,  0.9839,  0.0912, -0.5099, -0.9072],
        [ 0.9289, -0.2666,  0.2284, -0.3464, -0.6554, -0.7979],
        [ 0.8069, -0.5593, -0.4484, -0.3076, -0.7705, -0.9032],
        [-0.9979, -0.9516, -0.9493,  0.2794,  0.9539, -0.9342],
        [-0.9369, -0.9862, -0.8916, -0.5238,  0.9860,  0.8381],
        [-0.8911, -0.0158, -0.8221, -0.9605,  0.5574,  0.4435],
        [ 0.9374,  0.9784,  0.4715, -0.3453, -0.9438, -0.7997],
        [ 0.9610,  0.5006,  0.7951,  0.4891, -0.9581, -0.8237]],
       device='cuda:0')
squash tensor([[-1.7668, -1.6832, -2.1013,  0.3525,  1.2062,  1.0142],
        [-1.7871, -1.8358, -1.8159, -0.7708,  2.6339,  2.0511],
        [ 1.4137,  0.4681,  0.2023,  0.7591,  0.7173,  0.5506],
        [ 2.0971,  0.6527,  1.5269,  0.1624, -3.0993, -1.7721],
        [ 1.8953,  0.7668,  2.2732,  0.0555, -2.3961, -1.5701],
        [ 2.6024,  0.8483, -0.8173,  0.5837, -1.7589, -0.7610],
        [-3.8439, -1.0302, -2.4687,  0.8757,  2.4284,  2.0449],
        [-1.2129, -2.4451, -1.6493, -0.1828,  1.8874,  1.4359],
        [ 1.1773,  0.0411, -1.2073, -0.9269,  1.3703,  0.7076],
        [ 2.4584, -0.1620,  3.1439,  1.5132,  0.2758,  1.9031],
        [ 0.3435, -0.5927,  0.6022,  0.1751, -0.1220,  0.3287],
        [ 1.6965,  0.9024,  2.6383, -0.1628, -0.1904, -0.4555],
        [ 1.3661, -0.0410,  2.4061,  0.0914, -0.5626, -1.5113],
        [ 1.6503, -0.2733,  0.2325, -0.3614, -0.7847, -1.0927],
        [ 1.1180, -0.6318, -0.4827, -0.3179, -1.0215, -1.4893],
        [-3.4381, -1.8489, -1.8245,  0.2870,  1.8738, -1.6908],
        [-1.7123, -2.4836, -1.4296, -0.5815,  2.4785,  1.2146],
        [-1.4275, -0.0158, -1.1632, -1.9519,  0.6291,  0.4765],
        [ 1.7161,  2.2577,  0.5119, -0.3600, -1.7721, -1.0978],
        [ 1.9583,  0.5501,  1.0853,  0.5348, -1.9226, -1.1683]],
       device='cuda:0')
action: tensor([[-0.9725, -0.9951, -0.9795, -0.8679,  0.8037,  0.5772],
        [ 0.6491,  0.9901, -0.9774, -0.8199, -0.2923, -0.2806],
        [ 0.9358,  0.2734,  0.9734,  0.6716, -0.4819,  0.5896],
        [ 0.8703,  0.3491,  0.9415, -0.3193, -0.7214,  0.1927],
        [ 0.9858,  0.8186,  0.8624, -0.0609, -0.9214, -0.9680],
        [ 0.8546,  0.3627, -0.6341,  0.3152, -0.9176, -0.9076],
        [-0.9960, -0.9755, -0.9678, -0.0423,  0.9579, -0.5189],
        [-0.9963, -0.9617, -0.9471, -0.3032,  0.9938,  0.9687],
        [ 0.1469, -0.0168, -0.7686, -0.1913,  0.8972,  0.6746],
        [ 0.9891,  0.2631,  0.9553,  0.3980, -0.7672, -0.8546],
        [ 0.9346, -0.3561,  0.9631, -0.0259, -0.9678, -0.3221],
        [ 0.9842,  0.3873,  0.9312,  0.6949, -0.9964, -0.5044],
        [ 0.8807, -0.1664, -0.8387,  0.4576, -0.9616, -0.5402],
        [-0.9943, -0.9825, -0.9819,  0.5961,  0.9718,  0.7925],
        [-0.9914, -0.9870, -0.9709, -0.7849,  0.9724,  0.9723],
        [ 0.8032,  0.8091, -0.9281, -0.0681,  0.1178,  0.0382],
        [ 0.9958, -0.0615,  0.9922,  0.5210, -0.8613, -0.1127],
        [ 0.9487,  0.4649,  0.9921,  0.2190, -0.9903, -0.3297],
        [ 0.9727,  0.6023, -0.7705,  0.5495, -0.9250, -0.8749],
        [-0.9905, -0.8563, -0.9180,  0.6611,  0.9817,  0.8600]],
       device='cuda:0')
squash tensor([[-2.1364, -3.0012, -2.2840, -1.3245,  1.1090,  0.6583],
        [ 0.7737,  2.6514, -2.2359, -1.1565, -0.3011, -0.2883],
        [ 1.7035,  0.2806,  2.1527,  0.8136, -0.5254,  0.6771],
        [ 1.3344,  0.3644,  1.7512, -0.3309, -0.9105,  0.1952],
        [ 2.4710,  1.1526,  1.3028, -0.0610, -1.5981, -2.0593],
        [ 1.2728,  0.3800, -0.7483,  0.3263, -1.5733, -1.5137],
        [-3.1059, -2.1942, -2.0558, -0.0423,  1.9197, -0.5749],
        [-3.1465, -1.9681, -1.8024, -0.3131,  2.8831,  2.0704],
        [ 0.1479, -0.0168, -1.0168, -0.1937,  1.4578,  0.8191],
        [ 2.6010,  0.2694,  1.8897,  0.4213, -1.0136, -1.2730],
        [ 1.6934, -0.3724,  1.9875, -0.0259, -2.0560, -0.3339],
        [ 2.4157,  0.4086,  1.6675,  0.8574, -3.1558, -0.5552],
        [ 1.3788, -0.1680, -1.2167,  0.4942, -1.9663, -0.6045],
        [-2.9275, -2.3644, -2.3488,  0.6870,  2.1228,  1.0780],
        [-2.7204, -2.5149, -2.1072, -1.0581,  2.1352,  2.1325],
        [ 1.1077,  1.1244, -1.6446, -0.0682,  0.1184,  0.0382],
        [ 3.0848, -0.0615,  2.7735,  0.5777, -1.2982, -0.1132],
        [ 1.8185,  0.5035,  2.7655,  0.2226, -2.6642, -0.3425],
        [ 2.1406,  0.6967, -1.0215,  0.6177, -1.6228, -1.3538],
        [-2.6704, -1.2791, -1.5761,  0.7947,  2.3437,  1.2932]],
       device='cuda:0')
action: tensor([[-0.9670, -0.7205, -0.9773, -0.4761,  0.9907,  0.7115],
        [ 0.8577,  0.3177,  0.0579,  0.1824,  0.9795,  0.1694],
        [ 0.9977,  0.3389,  0.9935,  0.4836, -0.9616, -0.6792],
        [ 0.9935,  0.3049,  0.9654,  0.3043, -0.4666, -0.6279],
        [ 0.8153,  0.1925,  0.4990,  0.7538, -0.8589, -0.8598],
        [-0.9747, -0.9722, -0.9385,  0.9266,  0.9616,  0.9479],
        [-0.9797, -0.9912, -0.9924,  0.2179,  0.9757,  0.8489],
        [ 0.9230,  0.6071, -0.9208, -0.6362, -0.0742,  0.3899],
        [ 0.9737, -0.2116,  0.9800,  0.7451, -0.8857,  0.2443],
        [ 0.9884, -0.5493,  0.8611,  0.7424, -0.7580, -0.9581],
        [ 0.9447, -0.7700,  0.5223,  0.8841, -0.2994, -0.6265],
        [-0.9707, -0.8747, -0.9377,  0.3008,  0.9131, -0.9248],
        [-0.8987, -0.9810, -0.8889, -0.5669,  0.6746,  0.6946],
        [-0.1411,  0.1215, -0.4022, -0.9217,  0.6332,  0.6925],
        [ 0.9856,  0.0860,  0.9907,  0.3058, -0.9388, -0.8863],
        [ 0.9790,  0.5146,  0.7533,  0.7454, -0.9716, -0.8898],
        [ 0.9231, -0.9657, -0.8915,  0.9789, -0.6553, -0.6671],
        [-0.9838, -0.7861, -0.9885,  0.9982,  0.9835,  0.9040],
        [-0.9958, -0.9946, -0.9621, -0.4999,  0.9369, -0.4970],
        [-0.0127,  0.9578, -0.8915, -0.5202, -0.1463,  0.1874]],
       device='cuda:0')
squash tensor([[-2.0438, -0.9086, -2.2332, -0.5180,  2.6830,  0.8901],
        [ 1.2845,  0.3291,  0.0580,  0.1845,  2.2859,  0.1710],
        [ 3.3885,  0.3528,  2.8612,  0.5277, -1.9672, -0.8277],
        [ 2.8614,  0.3150,  2.0194,  0.3143, -0.5057, -0.7380],
        [ 1.1426,  0.1949,  0.5480,  0.9816, -1.2891, -1.2925],
        [-2.1793, -2.1306, -1.7257,  1.6340,  1.9671,  1.8106],
        [-2.2912, -2.7083, -2.7863,  0.2214,  2.1986,  1.2523],
        [ 1.6089,  0.7043, -1.5945, -0.7517, -0.0744,  0.4116],
        [ 2.1594, -0.2149,  2.2979,  0.9620, -1.4017,  0.2493],
        [ 2.5717, -0.6173,  1.2976,  0.9559, -0.9915, -1.9221],
        [ 1.7797, -1.0202,  0.5795,  1.3944, -0.3089, -0.7356],
        [-2.1037, -1.3527, -1.7186,  0.3104,  1.5462, -1.6215],
        [-1.4656, -2.3233, -1.4168, -0.6429,  0.8192,  0.8568],
        [-0.1420,  0.1221, -0.4263, -1.6004,  0.7468,  0.8527],
        [ 2.4643,  0.0862,  2.6813,  0.3159, -1.7282, -1.4043],
        [ 2.2723,  0.5690,  0.9806,  0.9624, -2.1195, -1.4208],
        [ 1.6098, -2.0236, -1.4291,  2.2708, -0.7845, -0.8056],
        [-2.4042, -1.0610, -2.5765,  3.5146,  2.3933,  1.4936],
        [-3.0770, -2.9513, -1.9739, -0.5492,  1.7118, -0.5453],
        [-0.0127,  1.9191, -1.4290, -0.5766, -0.1474,  0.1897]],
       device='cuda:0')
action: tensor([[ 6.6488e-01,  8.4354e-01, -9.5179e-01, -9.5974e-01, -1.0899e-01,
         -5.7290e-01],
        [ 9.9826e-01, -4.2591e-01,  9.8840e-01, -9.3351e-01, -9.6314e-01,
         -7.9975e-01],
        [ 9.9927e-01,  9.1420e-01,  2.0340e-01, -3.4197e-01, -9.3622e-01,
         -9.1497e-01],
        [-9.8476e-01, -6.1497e-01, -9.1062e-01,  8.1447e-01,  9.8941e-01,
          9.8262e-01],
        [-9.8664e-01, -9.9732e-01, -9.6432e-01, -4.1037e-01,  9.7134e-01,
          9.7051e-01],
        [ 9.0226e-01,  2.2419e-01, -7.1320e-01,  4.4649e-01,  8.5810e-01,
          8.7338e-01],
        [ 9.7186e-01,  5.3031e-02,  9.7812e-01,  5.8539e-05, -8.2264e-01,
         -4.0339e-01],
        [ 9.8610e-01, -5.2601e-01,  9.7440e-01, -3.8694e-01, -9.6198e-01,
         -9.3019e-01],
        [ 9.9854e-01,  6.1427e-01,  9.9688e-01,  6.2925e-01, -8.6981e-01,
         -7.4870e-01],
        [ 9.7046e-01,  4.0898e-01, -9.1178e-01,  3.4531e-02, -8.3274e-01,
         -9.6690e-01],
        [-9.8222e-01, -9.1924e-01, -9.2489e-01,  2.0837e-01,  9.7712e-01,
          7.8130e-01],
        [-9.3854e-01, -9.9199e-01, -8.9904e-01, -6.0727e-01,  9.2499e-01,
          7.0683e-01],
        [ 5.8537e-01,  6.3537e-01, -2.3744e-01, -3.4507e-01,  7.7349e-01,
         -3.4656e-01],
        [ 9.9819e-01, -3.0704e-01,  9.8934e-01,  2.8509e-01, -9.2744e-01,
         -8.7410e-01],
        [ 9.8798e-01,  6.2810e-01,  9.9620e-01,  3.0060e-01, -9.6159e-01,
         -8.0680e-01],
        [ 8.9332e-01, -4.7117e-01, -9.6801e-01,  8.6493e-01, -9.3468e-01,
          7.1511e-01],
        [-9.6862e-01, -9.7715e-01, -9.9619e-01,  8.2982e-01,  9.7379e-01,
          9.1127e-01],
        [-9.6713e-01, -9.9117e-01, -9.6942e-01, -6.7230e-01,  9.0196e-01,
          7.6076e-01],
        [ 9.0005e-01,  4.3353e-01, -9.7387e-01, -1.2403e-01,  6.6876e-01,
          8.9582e-01],
        [ 9.8801e-01, -5.5377e-02,  8.9481e-01,  2.8179e-01, -6.8308e-01,
         -4.1210e-01]], device='cuda:0')
squash tensor([[ 8.0152e-01,  1.2333e+00, -1.8505e+00, -1.9427e+00, -1.0943e-01,
         -6.5183e-01],
        [ 3.5240e+00, -4.5488e-01,  2.5719e+00, -1.6851e+00, -1.9876e+00,
         -1.0979e+00],
        [ 3.9594e+00,  1.5525e+00,  2.0627e-01, -3.5632e-01, -1.7065e+00,
         -1.5572e+00],
        [-2.4345e+00, -7.1687e-01, -1.5311e+00,  1.1402e+00,  2.6178e+00,
          2.3686e+00],
        [-2.5008e+00, -3.3078e+00, -2.0042e+00, -4.3605e-01,  2.1155e+00,
          2.1009e+00],
        [ 1.4843e+00,  2.2807e-01, -8.9367e-01,  4.8031e-01,  1.2861e+00,
          1.3472e+00],
        [ 2.1248e+00,  5.3081e-02,  2.2521e+00,  5.8539e-05, -1.1649e+00,
         -4.2769e-01],
        [ 2.4809e+00, -5.8461e-01,  2.1727e+00, -4.0820e-01, -1.9717e+00,
         -1.6598e+00],
        [ 3.6118e+00,  7.1576e-01,  3.2312e+00,  7.4018e-01, -1.3323e+00,
         -9.6999e-01],
        [ 2.1001e+00,  4.3438e-01, -1.5380e+00,  3.4545e-02, -1.1970e+00,
         -2.0423e+00],
        [-2.3571e+00, -1.5841e+00, -1.6219e+00,  2.1146e-01,  2.2295e+00,
          1.0487e+00],
        [-1.7256e+00, -2.7583e+00, -1.4672e+00, -7.0459e-01,  1.6225e+00,
          8.8082e-01],
        [ 6.7059e-01,  7.5037e-01, -2.4206e-01, -3.5983e-01,  1.0289e+00,
         -3.6153e-01],
        [ 3.5028e+00, -3.1727e-01,  2.6144e+00,  2.9321e-01, -1.6398e+00,
         -1.3502e+00],
        [ 2.5542e+00,  7.3828e-01,  3.1316e+00,  3.1017e-01, -1.9666e+00,
         -1.1178e+00],
        [ 1.4381e+00, -5.1158e-01, -2.0597e+00,  1.3126e+00, -1.6942e+00,
          8.9756e-01],
        [-2.0694e+00, -2.2303e+00, -3.1303e+00,  1.1876e+00,  2.1608e+00,
          1.5349e+00],
        [-2.0459e+00, -2.7089e+00, -2.0825e+00, -8.1493e-01,  1.4826e+00,
          9.9802e-01],
        [ 1.4725e+00,  4.6423e-01, -2.1624e+00, -1.2468e-01,  8.0849e-01,
          1.4506e+00],
        [ 2.5552e+00, -5.5434e-02,  1.4456e+00,  2.8963e-01, -8.3487e-01,
         -4.3814e-01]], device='cuda:0')
action: tensor([[-0.9861, -0.9662, -0.3469,  0.3625,  0.9953,  0.9430],
        [-0.9781, -0.9409, -0.9902,  0.1298,  0.9754,  0.3905],
        [ 0.8841, -0.1308, -0.7147,  0.4191,  0.8480, -0.1001],
        [ 0.9756,  0.0186,  0.9912,  0.2739, -0.5338, -0.7278],
        [ 0.9945, -0.5595,  0.9401, -0.3535, -0.9221,  0.2746],
        [ 0.9897,  0.6077,  0.9769,  0.4715, -0.9352, -0.9563],
        [ 0.9788,  0.5587, -0.7939,  0.3977, -0.9382, -0.8959],
        [-0.9746, -0.9479, -0.9718,  0.3021,  0.9867,  0.7500],
        [-0.9838, -0.9914, -0.9832, -0.7602,  0.9583,  0.9767],
        [ 0.8010,  0.4891, -0.4282,  0.1614,  0.8013,  0.7239],
        [ 0.9352, -0.4573,  0.9861,  0.5952, -0.9908, -0.8313],
        [ 0.6535, -0.5297,  0.2763,  0.9712, -0.9616,  0.2794],
        [-0.9788, -0.9330, -0.9633,  0.9932,  0.8835,  0.9336],
        [-0.9833, -0.9549, -0.8914,  0.6916,  0.9971,  0.9299],
        [ 0.7138,  0.1628, -0.8321,  0.0294,  0.1839,  0.3456],
        [ 0.9926,  0.8324,  0.7703,  0.5157, -0.9303, -0.1035],
        [ 0.4041, -0.9320,  0.8092,  0.5686,  0.3910, -0.1179],
        [-0.9874,  0.8153, -0.2796,  0.5770,  0.4193, -0.3457],
        [-0.8634,  0.9583, -0.7896, -0.8827, -0.7720,  0.9673],
        [ 0.9808,  0.9875, -0.8363, -0.9874, -0.8429, -0.6276]],
       device='cuda:0')
squash tensor([[-2.4810, -2.0321, -0.3619,  0.3797,  3.0212,  1.7641],
        [-2.2518, -1.7460, -2.6543,  0.1306,  2.1935,  0.4124],
        [ 1.3941, -0.1316, -0.8967,  0.4466,  1.2492, -0.1004],
        [ 2.1960,  0.0186,  2.7093,  0.2811, -0.5955, -0.9240],
        [ 2.9454, -0.6321,  1.7392, -0.3695, -1.6030,  0.2819],
        [ 2.6320,  0.7053,  2.2256,  0.5120, -1.6986, -1.9008],
        [ 2.2679,  0.6310, -1.0820,  0.4210, -1.7229, -1.4511],
        [-2.1764, -1.8107, -2.1238,  0.3118,  2.5051,  0.9731],
        [-2.4035, -2.7197, -2.3852, -0.9967,  1.9241,  2.2214],
        [ 1.1013,  0.5349, -0.4577,  0.1629,  1.1024,  0.9158],
        [ 1.6979, -0.4939,  2.4802,  0.6857, -2.6910, -1.1923],
        [ 0.7813, -0.5897,  0.2836,  2.1129, -1.9663,  0.2871],
        [-2.2677, -1.6808, -1.9900,  2.8401,  1.3916,  1.6861],
        [-2.3871, -1.8847, -1.4286,  0.8511,  3.2600,  1.6574],
        [ 0.8949,  0.1642, -1.1950,  0.0294,  0.1860,  0.3605],
        [ 2.7992,  1.1959,  1.0212,  0.5705, -1.6608, -0.1039],
        [ 0.4286, -1.6737,  1.1246,  0.6454,  0.4130, -0.1185],
        [-2.5318,  1.1427, -0.2872,  0.6579,  0.4468, -0.3606],
        [-1.3064,  1.9248, -1.0703, -1.3879, -1.0254,  2.0491],
        [ 2.3195,  2.5333, -1.2087, -2.5302, -1.2313, -0.7374]],
       device='cuda:0')
action: tensor([[ 0.9966,  0.6238,  0.9646,  0.4832, -0.9634, -0.9873],
        [ 0.9869,  0.1516, -0.6812, -0.1976, -0.9935, -0.9443],
        [-0.9947, -0.8534, -0.9413,  0.2757,  0.9333,  0.6244],
        [-0.9894, -0.9912, -0.9903, -0.3589,  0.9371,  0.9561],
        [ 0.6518,  0.4810, -0.9567, -0.6578,  0.7947,  0.8808],
        [ 0.9620, -0.1300,  0.9683,  0.5797, -0.4248, -0.5046],
        [ 0.4100, -0.0391,  0.6664,  0.6229, -0.6758, -0.4609],
        [ 0.7722, -0.7323, -0.6817,  0.5660, -0.5198, -0.8865],
        [-0.9923, -0.9802, -0.9823,  0.8753,  0.9606, -0.9061],
        [-0.9675, -0.9300, -0.9708, -0.9012,  0.9085, -0.1875],
        [ 0.1406,  0.9738, -0.9658, -0.9850, -0.8173, -0.6601],
        [ 0.9800,  0.9661,  0.5609,  0.4585, -0.9001, -0.6989],
        [ 0.9932,  0.5079,  0.9801, -0.1578, -0.5048, -0.2512],
        [ 0.9965,  0.8172,  0.6206, -0.3282, -0.8511, -0.9299],
        [ 0.9690,  0.5230, -0.9061,  0.4422, -0.7647, -0.7470],
        [-0.9837, -0.9909, -0.9157, -0.0114,  0.8565, -0.5268],
        [-0.9592, -0.9942, -0.9580, -0.1950,  0.9905,  0.8737],
        [ 0.7880,  0.6509, -0.8770, -0.7802,  0.5761,  0.8848],
        [ 0.9957,  0.1062,  0.9829,  0.4983, -0.9628, -0.6129],
        [ 0.9432,  0.3427,  0.4660,  0.7963, -0.8773,  0.3817]],
       device='cuda:0')
squash tensor([[ 3.1897,  0.7313,  2.0085,  0.5272, -1.9918, -2.5279],
        [ 2.5105,  0.1528, -0.8313, -0.2002, -2.8631, -1.7767],
        [-2.9666, -1.2685, -1.7491,  0.2830,  1.6834,  0.7321],
        [-2.6164, -2.7112, -2.6637, -0.3756,  1.7141,  1.8988],
        [ 0.7784,  0.5242, -1.9049, -0.7890,  1.0841,  1.3792],
        [ 1.9717, -0.1308,  2.0642,  0.6620, -0.4535, -0.5555],
        [ 0.4356, -0.0392,  0.8042,  0.7297, -0.8213, -0.4984],
        [ 1.0257, -0.9336, -0.8323,  0.6416, -0.5761, -1.4052],
        [-2.7805, -2.3025, -2.3580,  1.3555,  1.9541, -1.5054],
        [-2.0520, -1.6585, -2.1065, -1.4787,  1.5190, -0.1897],
        [ 0.1415,  2.1605, -2.0261, -2.4426, -1.1487, -0.7930],
        [ 2.2966,  2.0300,  0.6341,  0.4954, -1.4727, -0.8652],
        [ 2.8421,  0.5599,  2.2999, -0.1592, -0.5557, -0.2567],
        [ 3.1688,  1.1482,  0.7260, -0.3408, -1.2602, -1.6578],
        [ 2.0762,  0.5805, -1.5054,  0.4750, -1.0075, -0.9661],
        [-2.3995, -2.6953, -1.5615, -0.0114,  1.2802, -0.5856],
        [-1.9356, -2.9173, -1.9206, -0.1975,  2.6716,  1.3485],
        [ 1.0662,  0.7768, -1.3625, -1.0458,  0.6566,  1.3973],
        [ 3.0758,  0.1066,  2.3763,  0.5471, -1.9831, -0.7135],
        [ 1.7660,  0.3572,  0.5049,  1.0885, -1.3638,  0.4020]],
       device='cuda:0')
action: tensor([[ 0.9806,  0.3255,  0.9182,  0.4700, -0.9889, -0.8127],
        [ 0.9611, -0.3892, -0.8654,  0.9970, -0.9122,  0.6052],
        [-0.9951, -0.9576, -0.9853,  0.9891,  0.9826,  0.9428],
        [-0.8589, -0.9698, -0.9901, -0.1316,  0.4613,  0.6948],
        [ 0.8868,  0.1579, -0.7701, -0.3683,  0.8988,  0.0872],
        [ 0.9316, -0.0514,  0.9950,  0.8419,  0.1230,  0.6066],
        [-0.9893, -0.0887, -0.7665,  0.4112, -0.5244,  0.4162],
        [-0.8796,  0.9964, -0.9526, -0.8174, -0.0961,  0.7699],
        [ 0.9277,  0.9932, -0.9292, -0.9545, -0.9274, -0.8557],
        [ 0.9988, -0.2952,  0.9875, -0.9680, -0.9582, -0.7167],
        [ 0.9962,  0.6368, -0.5308,  0.5456, -0.9952, -0.9636],
        [-0.9889, -0.9663, -0.9778,  0.3081,  0.9705,  0.9573],
        [-0.9225, -0.9845, -0.9354, -0.7455,  0.9588,  0.9375],
        [ 0.8192,  0.6990, -0.8609,  0.1409,  0.7946,  0.5399],
        [ 0.9873, -0.4156,  0.9753,  0.6207, -0.9923, -0.9349],
        [ 0.9806,  0.4583,  0.9714, -0.1002, -0.9778, -0.6741],
        [ 0.9914,  0.5567, -0.8159,  0.8510, -0.9965, -0.5310],
        [-0.9939, -0.9768, -0.9899,  0.8326,  0.9877,  0.9370],
        [-0.9953, -0.9870, -0.9901, -0.0209,  0.9555,  0.9608],
        [ 0.9053, -0.6247, -0.6252, -0.3793,  0.6622, -0.6352]],
       device='cuda:0')
squash tensor([[ 2.3132,  0.3378,  1.5777,  0.5101, -2.5921, -1.1348],
        [ 1.9599, -0.4109, -1.3144,  3.2506, -1.5407,  0.7013],
        [-3.0038, -1.9159, -2.4527,  2.6015,  2.3674,  1.7628],
        [-1.2890, -2.0892, -2.6514, -0.1323,  0.4989,  0.8571],
        [ 1.4067,  0.1592, -1.0206, -0.3864,  1.4660,  0.0874],
        [ 1.6705, -0.0515,  2.9897,  1.2277,  0.1236,  0.7035],
        [-2.6144, -0.0889, -1.0118,  0.4370, -0.5824,  0.4431],
        [-1.3741,  3.1541, -1.8596, -1.1488, -0.0964,  1.0201],
        [ 1.6417,  2.8419, -1.6524, -1.8803, -1.6397, -1.2771],
        [ 3.7067, -0.3043,  2.5331, -2.0602, -1.9232, -0.9008],
        [ 3.1323,  0.7527, -0.5913,  0.6121, -3.0140, -1.9942],
        [-2.5958, -2.0325, -2.2452,  0.3185,  2.1013,  1.9126],
        [-1.6055, -2.4273, -1.7002, -0.9628,  1.9313,  1.7173],
        [ 1.1543,  0.8654, -1.2967,  0.1419,  1.0837,  0.6041],
        [ 2.5248, -0.4424,  2.1899,  0.7261, -2.7780, -1.6960],
        [ 2.3119,  0.4951,  2.1157, -0.1006, -2.2441, -0.8183],
        [ 2.7200,  0.6281, -1.1444,  1.2597, -3.1771, -0.5915],
        [-2.8950, -2.2226, -2.6402,  1.1966,  2.5440,  1.7132],
        [-3.0229, -2.5138, -2.6522, -0.0209,  1.8918,  1.9559],
        [ 1.5007, -0.7327, -0.7335, -0.3993,  0.7967, -0.7501]],
       device='cuda:0')
action: tensor([[ 0.9907,  0.6507,  0.9443,  0.5914, -0.9775, -0.4466],
        [ 0.9925, -0.2805, -0.8980,  0.9648,  0.0599, -0.1608],
        [-0.9834, -0.9930, -0.9348,  0.7642,  0.9602,  0.8788],
        [-0.9959, -0.9708, -0.9874, -0.0732,  0.9451,  0.5187],
        [ 0.4470,  0.7231, -0.9712, -0.6650, -0.6578, -0.0219],
        [ 0.9764,  0.1739,  0.9907,  0.7928, -0.8662,  0.3452],
        [ 0.9959,  0.1902,  0.9082,  0.6173, -0.8691, -0.7292],
        [ 0.9876, -0.0823, -0.5133,  0.7424, -0.8693, -0.7243],
        [-0.9761, -0.8279, -0.7610,  0.5924,  0.8662, -0.3911],
        [-0.8100, -0.9785, -0.9658, -0.4150,  0.9615,  0.9202],
        [ 0.5595,  0.8532, -0.9258, -0.3569,  0.1339, -0.5076],
        [ 0.9264, -0.0814,  0.9632,  0.5152, -0.9705, -0.9476],
        [ 0.9658,  0.1120,  0.7301,  0.9704, -0.9688, -0.6324],
        [ 0.0841, -0.8232, -0.7458,  0.9964, -0.8181,  0.5369],
        [-0.9666, -0.9721, -0.9763,  0.9175,  0.9871,  0.8004],
        [-0.9935, -0.8205, -0.8978, -0.9899,  0.1514, -0.7568],
        [ 0.6121,  0.9661, -0.9809, -0.3125,  0.7133, -0.1056],
        [ 0.9698,  0.3459,  0.8965,  0.6717, -0.7108, -0.4438],
        [ 0.9828,  0.5529,  0.9896, -0.1670, -0.8764, -0.8596],
        [ 0.9963,  0.6344,  0.6018,  0.3068, -0.9732, -0.8533]],
       device='cuda:0')
squash tensor([[ 2.6805,  0.7765,  1.7768,  0.6798, -2.2370, -0.4804],
        [ 2.7923, -0.2883, -1.4620,  2.0112,  0.0600, -0.1622],
        [-2.3918, -2.8243, -1.6954,  1.0062,  1.9478,  1.3705],
        [-3.0981, -2.1057, -2.5289, -0.0733,  1.7842,  0.5746],
        [ 0.4810,  0.9141, -2.1126, -0.8018, -0.7889, -0.0219],
        [ 2.2135,  0.1756,  2.6829,  1.0790, -1.3178,  0.3600],
        [ 3.0888,  0.1925,  1.5172,  0.7207, -1.3292, -0.9269],
        [ 2.5384, -0.0824, -0.5671,  0.9559, -1.3302, -0.9166],
        [-2.2072, -1.1815, -0.9986,  0.6814,  1.3176, -0.4131],
        [-1.1271, -2.2615, -2.0253, -0.4416,  1.9651,  1.5901],
        [ 0.6320,  1.2679, -1.6278, -0.3734,  0.1347, -0.5595],
        [ 1.6325, -0.0816,  1.9889,  0.5698, -2.1008, -1.8079],
        [ 2.0254,  0.1124,  0.9290,  2.0991, -2.0724, -0.7453],
        [ 0.0843, -1.1665, -0.9635,  3.1593, -1.1511,  0.5998],
        [-2.0377, -2.1288, -2.2122,  1.5732,  2.5199,  1.0997],
        [-2.8642, -1.1582, -1.4607, -2.6436,  0.1525, -0.9888],
        [ 0.7123,  2.0304, -2.3206, -0.3234,  0.8938, -0.1060],
        [ 2.0884,  0.3608,  1.4542,  0.8138, -0.8888, -0.4769],
        [ 2.3750,  0.6225,  2.6267, -0.1686, -1.3602, -1.2917],
        [ 3.1439,  0.7488,  0.6960,  0.3170, -2.1500, -1.2680]],
       device='cuda:0')
action: tensor([[ 0.9881,  0.1535,  0.9929,  0.6562, -0.8164, -0.8562],
        [ 0.9296, -0.4534, -0.9101,  0.9411, -0.8727, -0.0985],
        [-0.9365, -0.9844, -0.9782,  0.7666,  0.9648,  0.7568],
        [-0.8851, -0.9892, -0.9340, -0.3206,  0.9070,  0.6246],
        [ 0.7265,  0.8546, -0.9602, -0.8218,  0.3953,  0.3061],
        [ 0.9737, -0.0196,  0.8869,  0.2063, -0.5282,  0.7755],
        [ 0.9985,  0.4460,  0.9919,  0.0646, -0.7525, -0.8321],
        [ 0.9784,  0.2793,  0.9564,  0.7062, -0.6965, -0.8125],
        [ 0.9570, -0.4481, -0.3695, -0.0221, -0.9167, -0.9351],
        [-0.9888, -0.9889, -0.5548,  0.3899,  0.8995, -0.7879],
        [-0.9474, -0.9852, -0.9485, -0.7259,  0.9820,  0.9385],
        [ 0.8051,  0.2299, -0.7887, -0.5890,  0.2929,  0.6147],
        [ 0.9925,  0.1355,  0.9962,  0.1086, -0.9690, -0.9653],
        [ 0.9894,  0.4084,  0.9699,  0.5108, -0.9423, -0.7219],
        [ 0.9949, -0.1601, -0.9772,  0.9486, -0.8991, -0.6405],
        [-0.9933, -0.9867, -0.9033,  0.7268,  0.9914,  0.3499],
        [-0.9727, -0.9843, -0.9770, -0.1527,  0.9808,  0.8508],
        [ 0.5076,  0.6999, -0.9334, -0.1878,  0.2340,  0.8159],
        [ 0.9928,  0.0485,  0.9611,  0.6424, -0.7397, -0.3203],
        [ 0.9948,  0.1168,  0.9954,  0.2343, -0.8727, -0.8093]],
       device='cuda:0')
squash tensor([[ 2.5582,  0.1547,  2.8177,  0.7861, -1.1460, -1.2789],
        [ 1.6551, -0.4889, -1.5283,  1.7478, -1.3444, -0.0988],
        [-1.7085, -2.4219, -2.2530,  1.0119,  2.0113,  0.9887],
        [-1.3987, -2.6087, -1.6887, -0.3323,  1.5103,  0.7326],
        [ 0.9212,  1.2728, -1.9479, -1.1623,  0.4181,  0.3162],
        [ 2.1599, -0.0196,  1.4074,  0.2093, -0.5877,  1.0340],
        [ 3.5901,  0.4797,  2.7554,  0.0647, -0.9788, -1.1950],
        [ 2.2598,  0.2869,  1.9023,  0.8796, -0.8606, -1.1344],
        [ 1.9090, -0.4824, -0.3878, -0.0221, -1.5681, -1.6974],
        [-2.5900, -2.5954, -0.6253,  0.4117,  1.4697, -1.0659],
        [-1.8055, -2.4506, -1.8166, -0.9201,  2.3501,  1.7252],
        [ 1.1129,  0.2341, -1.0681, -0.6761,  0.3017,  0.7165],
        [ 2.7879,  0.1363,  3.1354,  0.1091, -2.0756, -2.0179],
        [ 2.6178,  0.4337,  2.0911,  0.5638, -1.7583, -0.9116],
        [ 2.9798, -0.1615, -2.2315,  1.8177, -1.4677, -0.7590],
        [-2.8469, -2.5031, -1.4901,  0.9220,  2.7223,  0.3653],
        [-2.1396, -2.4189, -2.2279, -0.1539,  2.3194,  1.2591],
        [ 0.5595,  0.8670, -1.6845, -0.1900,  0.2384,  1.1444],
        [ 2.8144,  0.0485,  1.9598,  0.7622, -0.9498, -0.3319],
        [ 2.9707,  0.1174,  3.0374,  0.2387, -1.3445, -1.1251]],
       device='cuda:0')
action: tensor([[ 0.9999, -0.8416,  0.9999,  0.9933, -0.1515,  0.6466],
        [ 1.0000, -0.9855,  0.9958,  0.8681,  0.9000,  1.0000],
        [ 0.9976, -0.9927,  0.9966,  0.9609,  0.6614,  0.9833],
        [ 1.0000, -0.5964,  0.9994,  0.9882,  0.9485,  0.7736],
        [ 0.9995, -0.8816,  0.9988,  0.9967,  0.9880,  0.3896],
        [ 0.9991, -0.8097,  0.9991,  0.9954,  0.9887,  0.9710],
        [ 0.9826,  0.2134,  0.9980,  0.9882,  0.9375,  0.9956],
        [ 0.9990, -0.6569,  0.9989,  0.9530,  0.9981,  1.0000],
        [ 0.9985, -0.8485,  0.9642,  0.8088,  0.9650,  1.0000],
        [ 0.9994, -0.8741,  0.9921,  0.8760,  0.9771,  1.0000],
        [ 0.9998, -0.9068,  0.9925,  0.8600,  0.9540,  1.0000],
        [ 0.9995, -0.9108,  0.9959,  0.8846,  0.9908,  1.0000],
        [ 1.0000, -0.8991,  0.9947,  0.8955,  0.9920,  1.0000],
        [ 0.9999, -0.8803,  0.9973,  0.9434,  0.9991,  1.0000],
        [ 0.9999, -0.7939,  0.9998,  0.9889,  0.9996,  1.0000],
        [ 1.0000, -0.3026,  0.9999,  0.9988,  0.9999,  1.0000],
        [ 1.0000, -0.8147,  1.0000,  0.9995,  0.9999,  1.0000],
        [ 0.9991, -0.9527,  1.0000,  0.9982,  0.9996,  1.0000],
        [ 0.9999, -0.9945,  0.9985,  0.9880,  0.9999,  1.0000],
        [ 1.0000, -0.9944,  0.9998,  0.9930,  0.9994,  1.0000]],
       device='cuda:0')
squash tensor([[ 4.8357, -1.2266,  5.1264,  2.8449, -0.1527,  0.7694],
        [ 5.7311, -2.4582,  3.0869,  1.3252,  1.4722,  6.1557],
        [ 3.3569, -2.8034,  3.1902,  1.9575,  0.7953,  2.3895],
        [ 5.4431, -0.6875,  4.0903,  2.5655,  1.8166,  1.0291],
        [ 4.1667, -1.3829,  3.7099,  3.2011,  2.5539,  0.4113],
        [ 3.8416, -1.1261,  3.8285,  3.0316,  2.5833,  2.1094],
        [ 2.3682,  0.2167,  3.4473,  2.5631,  1.7171,  3.0630],
        [ 3.8078, -0.7873,  3.7710,  1.8636,  3.4768,  6.0253],
        [ 3.6105, -1.2507,  2.0028,  1.1237,  2.0134,  5.7297],
        [ 4.0613, -1.3503,  2.7657,  1.3583,  2.2297,  6.9315],
        [ 4.5017, -1.5093,  2.7882,  1.2932,  1.8744,  8.1150],
        [ 4.1253, -1.5322,  3.0910,  1.3967,  2.6904,  8.6643],
        [ 5.3085, -1.4676,  2.9623,  1.4491,  2.7613,  7.5657],
        [ 4.7890, -1.3772,  3.3050,  1.7678,  3.8329,  7.8596],
        [ 5.0571, -1.0818,  4.5321,  2.5948,  4.3175,  7.6914],
        [ 7.0753, -0.3124,  4.8435,  3.7028,  5.1247,  7.5657],
        [ 5.4399, -1.1408,  5.3824,  4.1353,  4.9887,  6.2919],
        [ 3.8596, -1.8607,  6.3719,  3.5083,  4.3151,  6.3233],
        [ 5.0404, -2.9509,  3.5910,  2.5535,  5.0820,  7.3448],
        [ 5.9860, -2.9344,  4.5257,  2.8231,  4.0707,  8.6643]],
       device='cuda:0')
action: tensor([[ 0.9639, -0.1722,  0.9741, -0.7501, -0.8949, -0.9758],
        [ 0.9825,  0.6954,  0.7849, -0.1343, -0.9865, -0.9775],
        [ 0.9828,  0.0315, -0.9809,  0.7915, -0.8693, -0.5111],
        [-0.9765, -0.9630, -0.9646,  0.7384,  0.9761,  0.9968],
        [-0.7806, -0.8338, -0.9259,  0.0050,  0.9827, -0.1836],
        [ 0.4526, -0.3373, -0.5755,  0.8064,  0.9332,  0.1118],
        [ 0.9642,  0.3289,  0.9695,  0.8470, -0.8968,  0.8230],
        [-0.9877, -0.6871, -0.7904,  0.2995, -0.5104,  0.8879],
        [ 0.5537,  0.9649, -0.7441, -0.8963, -0.1214,  0.4386],
        [ 0.9937, -0.6528,  0.8554, -0.9337, -0.8238, -0.9842],
        [ 0.9866,  0.7666, -0.7035,  0.5777, -0.8767, -0.7782],
        [-0.9901, -0.8029, -0.9619,  0.2332,  0.6436,  0.9511],
        [-0.9794, -0.8227, -0.8969, -0.4325,  0.9650,  0.7876],
        [ 0.8991,  0.0882,  0.6328,  0.7418,  0.7830,  0.7279],
        [ 0.9837,  0.3458,  0.9876,  0.4151, -0.9823, -0.8925],
        [ 0.8823,  0.3252,  0.9274,  0.2915, -0.9077, -0.8108],
        [ 0.9925,  0.4961, -0.9855,  0.9613, -0.9294,  0.7846],
        [-0.9760, -0.9292, -0.9814,  0.9408,  0.9303,  0.9863],
        [-0.9189, -0.8791, -0.9098, -0.1257,  0.5657,  0.1434],
        [ 0.2610, -0.3768, -0.6255, -0.6197,  0.6905,  0.1357]],
       device='cuda:0')
squash tensor([[ 1.9988, -0.1739,  2.1665, -0.9732, -1.4461, -2.2012],
        [ 2.3642,  0.8584,  1.0581, -0.1351, -2.4955, -2.2391],
        [ 2.3728,  0.0315, -2.3214,  1.0754, -1.3304, -0.5643],
        [-2.2159, -1.9855, -2.0083,  0.9469,  2.2082,  3.2159],
        [-1.0469, -1.2005, -1.6290,  0.0050,  2.3717, -0.1857],
        [ 0.4879, -0.3510, -0.6557,  1.1166,  1.6829,  0.1122],
        [ 2.0032,  0.3416,  2.0838,  1.2453, -1.4557,  1.1660],
        [-2.5429, -0.8425, -1.0725,  0.3090, -0.5633,  1.4117],
        [ 0.6238,  2.0122, -0.9596, -1.4530, -0.1220,  0.4705],
        [ 2.8803, -0.7802,  1.2759, -1.6869, -1.1684, -2.4150],
        [ 2.5005,  1.0121, -0.8743,  0.6590, -1.3614, -1.0409],
        [-2.6513, -1.1066, -1.9712,  0.2376,  0.7643,  1.8435],
        [-2.2828, -1.1651, -1.4561, -0.4630,  2.0135,  1.0650],
        [ 1.4677,  0.0885,  0.7461,  0.9544,  1.0530,  0.9243],
        [ 2.4023,  0.3607,  2.5372,  0.4418, -2.3598, -1.4343],
        [ 1.3863,  0.3375,  1.6398,  0.3002, -1.5144, -1.1293],
        [ 2.7895,  0.5441, -2.4609,  1.9632, -1.6542,  1.0572],
        [-2.2063, -1.6528, -2.3333,  1.7453,  1.6605,  2.4894],
        [-1.5819, -1.3719, -1.5262, -0.1264,  0.6412,  0.1444],
        [ 0.2672, -0.3963, -0.7340, -0.7245,  0.8489,  0.1365]],
       device='cuda:0')
action: tensor([[-0.8447,  0.1218, -0.7714, -0.6551, -0.6791,  0.8226],
        [ 0.7711,  0.8474, -0.9213, -0.9732,  0.0306,  0.2004],
        [ 0.9853, -0.5482,  0.9945, -0.9716, -0.9093,  0.1042],
        [ 0.9937,  0.3313, -0.5714,  0.4946, -0.9255, -0.9344],
        [-0.8882, -0.8392, -0.9681,  0.9164,  0.9342,  0.8389],
        [-0.9841, -0.9975, -0.9739, -0.8386,  0.9624,  0.8564],
        [ 0.8273,  0.2160, -0.9138,  0.2711,  0.6272, -0.1615],
        [ 0.9785,  0.3612,  0.9900,  0.0472, -0.8042, -0.3780],
        [ 0.9920, -0.5536,  0.9698,  0.4171, -0.9020, -0.7728],
        [ 0.9524,  0.4410,  0.9035,  0.2799, -0.9689, -0.9312],
        [ 0.9904,  0.1010, -0.5498,  0.5446, -0.8471, -0.9090],
        [-0.9967, -0.9807, -0.9108,  0.4046,  0.9123, -0.4024],
        [-0.9422, -0.9405, -0.9857, -0.5017,  0.9612,  0.8337],
        [ 0.5526,  0.6967, -0.9254, -0.5088,  0.3273,  0.2256],
        [ 0.9889,  0.3153,  0.9928,  0.5704, -0.6776, -0.6927],
        [ 0.9767, -0.0172,  0.9804,  0.9509, -0.9486, -0.0961],
        [ 0.8072, -0.8772, -0.8919,  0.9797, -0.8474, -0.8707],
        [-0.9766, -0.9756, -0.8820,  0.9929,  0.9808,  0.9544],
        [-0.9781, -0.9414, -0.8676, -0.7599,  0.9878,  0.7779],
        [-0.3294,  0.9763, -0.9814, -0.7844, -0.0337,  0.9424]],
       device='cuda:0')
squash tensor([[-1.2374,  0.1224, -1.0238, -0.7842, -0.8274,  1.1647],
        [ 1.0230,  1.2468, -1.5978, -2.1503,  0.0306,  0.2031],
        [ 2.4535, -0.6158,  2.9489, -2.1193, -1.5235,  0.1046],
        [ 2.8764,  0.3443, -0.6497,  0.5421, -1.6259, -1.6918],
        [-1.4135, -1.2186, -2.0613,  1.5659,  1.6902,  1.2176],
        [-2.4147, -3.3391, -2.1628, -1.2163,  1.9776,  1.2798],
        [ 1.1796,  0.2195, -1.5502,  0.2781,  0.7369, -0.1630],
        [ 2.2615,  0.3783,  2.6488,  0.0473, -1.1103, -0.3977],
        [ 2.7572, -0.6235,  2.0891,  0.4442, -1.4830, -1.0272],
        [ 1.8570,  0.4735,  1.4912,  0.2876, -2.0741, -1.6671],
        [ 2.6649,  0.1014, -0.6182,  0.6106, -1.2457, -1.5216],
        [-3.1989, -2.3163, -1.5321,  0.4291,  1.5409, -0.4265],
        [-1.7569, -1.7425, -2.4659, -0.5515,  1.9610,  1.2001],
        [ 0.6221,  0.8608, -1.6251, -0.5611,  0.3398,  0.2296],
        [ 2.5954,  0.3264,  2.8095,  0.6481, -0.8247, -0.8531],
        [ 2.2210, -0.0172,  2.3067,  1.8412, -1.8180, -0.0964],
        [ 1.1189, -1.3633, -1.4309,  2.2907, -1.2467, -1.3361],
        [-2.2174, -2.1979, -1.3847,  2.8173,  2.3172,  1.8793],
        [-2.2513, -1.7503, -1.3235, -0.9959,  2.5467,  1.0401],
        [-0.3421,  2.2116, -2.3329, -1.0566, -0.0337,  1.7589]],
       device='cuda:0')
action: tensor([[-0.9615, -0.9498, -0.9794,  0.8388,  0.9322,  0.9760],
        [-0.9799, -0.8476, -0.9468, -0.3226,  0.9270,  0.9405],
        [ 0.9654,  0.4238, -0.6611,  0.2906,  0.6888,  0.4985],
        [ 0.9695, -0.2949,  0.9664,  0.3565, -0.8959, -0.7340],
        [ 0.9783, -0.1971,  0.9859,  0.4122, -0.9439, -0.6109],
        [ 0.9354,  0.1623,  0.8541,  0.8391, -0.9484, -0.7362],
        [-0.9802, -0.9743, -0.9989,  0.8393,  0.9362,  0.2499],
        [-0.9709, -0.9868, -0.9338, -0.6176,  0.9952,  0.5320],
        [ 0.7065,  0.2321, -0.7164,  0.1584,  0.7587,  0.1508],
        [ 0.9594, -0.0170,  0.9978,  0.0541, -0.8362, -0.8928],
        [ 0.9873, -0.4331,  0.9355,  0.7623, -0.6034, -0.5100],
        [ 0.4954, -0.8415, -0.6215,  0.9807, -0.8081, -0.9766],
        [-0.9969, -0.8946, -0.9572,  0.9068,  0.9236,  0.5244],
        [-0.9632, -0.9873, -0.9761, -0.8923,  0.9811,  0.6600],
        [ 0.8821,  0.6809, -0.8609, -0.0769,  0.3970,  0.8804],
        [ 0.9883, -0.0070,  0.9446, -0.2634, -0.4594, -0.6104],
        [ 0.9803, -0.3372,  0.9009,  0.7582, -0.9058, -0.6603],
        [ 0.9360, -0.4346, -0.0456,  0.8782, -0.8884, -0.7452],
        [-0.9966, -0.9639, -0.8587,  0.6090,  0.9586,  0.4555],
        [-0.9072, -0.9837, -0.9550, -0.6900,  0.8897,  0.6505]],
       device='cuda:0')
squash tensor([[-1.9651, -1.8295, -2.2823,  1.2172,  1.6748,  2.2059],
        [-2.2943, -1.2477, -1.7995, -0.3345,  1.6364,  1.7424],
        [ 2.0200,  0.4523, -0.7948,  0.2992,  0.8458,  0.5473],
        [ 2.0845, -0.3039,  2.0345,  0.3728, -1.4513, -0.9374],
        [ 2.2554, -0.1997,  2.4753,  0.4382, -1.7729, -0.7104],
        [ 1.7002,  0.1638,  1.2711,  1.2180, -1.8158, -0.9421],
        [-2.3022, -2.1714, -3.7619,  1.2189,  1.7061,  0.2553],
        [-2.1083, -2.5074, -1.6870, -0.7211,  3.0133,  0.5929],
        [ 0.8801,  0.2364, -0.9003,  0.1598,  0.9932,  0.1520],
        [ 1.9387, -0.0170,  3.3956,  0.0542, -1.2083, -1.4355],
        [ 2.5266, -0.4637,  1.7009,  1.0017, -0.6985, -0.5627],
        [ 0.5432, -1.2262, -0.7274,  2.3160, -1.1215, -2.2185],
        [-3.2271, -1.4446, -1.9115,  1.5091,  1.6129,  0.5824],
        [-1.9885, -2.5251, -2.2084, -1.4332,  2.3266,  0.7929],
        [ 1.3853,  0.8307, -1.2968, -0.0770,  0.4201,  1.3777],
        [ 2.5684, -0.0070,  1.7793, -0.2698, -0.4966, -0.7095],
        [ 2.3045, -0.3509,  1.4771,  0.9920, -1.5035, -0.7934],
        [ 1.7049, -0.4656, -0.0456,  1.3680, -1.4142, -0.9621],
        [-3.1823, -1.9980, -1.2884,  0.7073,  1.9278,  0.4916],
        [-1.5116, -2.4005, -1.8854, -0.8479,  1.4206,  0.7761]],
       device='cuda:0')
action: tensor([[ 0.9840,  0.6024,  0.8812, -0.1392, -0.8382, -0.9010],
        [ 0.9912,  0.8668, -0.8203,  0.1067, -0.9763, -0.9581],
        [-0.9944, -0.9656, -0.9737, -0.0808,  0.9866,  0.6405],
        [-0.9595, -0.9776, -0.9790, -0.6557,  0.9851,  0.7716],
        [ 0.9743,  0.7837, -0.8283, -0.5414,  0.8504,  0.0489],
        [ 0.8090, -0.9304,  0.9746,  0.4448, -0.5852,  0.1243],
        [ 0.9856, -0.1667,  0.9615,  0.0505, -0.8389, -0.7430],
        [ 0.9739, -0.2014,  0.7952,  0.8401, -0.9250, -0.9581],
        [-0.9863, -0.7148, -0.8672,  0.4981,  0.9782,  0.0593],
        [-0.9838, -0.9568, -0.9536, -0.3676,  0.9280, -0.0760],
        [ 0.6772,  0.6758, -0.8847, -0.2949,  0.5753,  0.3345],
        [ 0.9640, -0.1830,  0.9931, -0.4457, -0.9731, -0.7022],
        [ 0.9975, -0.7792,  0.9818,  0.7722, -0.8096,  0.0671],
        [ 0.9191, -0.8284, -0.6165,  0.7570, -0.8451, -0.8720],
        [-0.9958, -0.9775, -0.9250,  0.9243,  0.9882,  0.6560],
        [-0.9760, -0.9775, -0.9956, -0.9275,  0.8997,  0.4961],
        [ 0.2511,  0.6985, -0.9398, -0.9342,  0.4650, -0.1599],
        [ 0.9849,  0.5558,  0.9921,  0.5988, -0.6858,  0.3822],
        [ 0.9254,  0.3180,  0.9479, -0.2807, -0.7527, -0.5862],
        [ 0.9466,  0.3187,  0.9494, -0.1490, -0.8310, -0.8529]],
       device='cuda:0')
squash tensor([[ 2.4115,  0.6969,  1.3809, -0.1401, -1.2150, -1.4773],
        [ 2.7122,  1.3201, -1.1579,  0.1071, -2.2127, -1.9220],
        [-2.9410, -2.0226, -2.1592, -0.0809,  2.5008,  0.7590],
        [-1.9396, -2.2414, -2.2731, -0.7852,  2.4475,  1.0244],
        [ 2.1703,  1.0548, -1.1828, -0.6061,  1.2574,  0.0489],
        [ 1.1242, -1.6611,  2.1758,  0.4782, -0.6704,  0.1249],
        [ 2.4649, -0.1683,  1.9658,  0.0506, -1.2175, -0.9571],
        [ 2.1635, -0.2042,  1.0855,  1.2215, -1.6227, -1.9227],
        [-2.4866, -0.8970, -1.3218,  0.5468,  2.2540,  0.0594],
        [-2.4051, -1.9070, -1.8705, -0.3857,  1.6436, -0.0761],
        [ 0.8240,  0.8214, -1.3971, -0.3039,  0.6555,  0.3479],
        [ 1.9996, -0.1851,  2.8295, -0.4793, -2.1474, -0.8716],
        [ 3.3380, -1.0434,  2.3441,  1.0258, -1.1259,  0.0672],
        [ 1.5834, -1.1831, -0.7193,  0.9891, -1.2387, -1.3416],
        [-3.0770, -2.2375, -1.6229,  1.6178,  2.5650,  0.7857],
        [-2.2047, -2.2380, -3.0544, -1.6403,  1.4704,  0.5441],
        [ 0.2566,  0.8643, -1.7360, -1.6903,  0.5037, -0.1612],
        [ 2.4380,  0.6267,  2.7680,  0.6913, -0.8399,  0.4026],
        [ 1.6255,  0.3294,  1.8109, -0.2884, -0.9793, -0.6719],
        [ 1.7977,  0.3302,  1.8260, -0.1501, -1.1913, -1.2666]],
       device='cuda:0')
action: tensor([[ 0.9296,  0.1207,  0.7167,  0.3257, -0.9889, -0.8428],
        [ 0.9943,  0.1231, -0.9744,  0.9818, -0.5931,  0.9087],
        [-0.9868, -0.9897, -0.9792,  0.9954,  0.9804,  0.7151],
        [-0.9806, -0.9929, -0.9004,  0.1690,  0.8711,  0.5602],
        [ 0.8681, -0.0968, -0.8990, -0.4609,  0.8837,  0.7296],
        [ 0.9758,  0.3239,  0.9825,  0.4438, -0.1706,  0.8715],
        [-0.8714, -0.0249, -0.8472,  0.4140,  0.1916, -0.2732],
        [-0.9858,  0.9889, -0.8206, -0.9007, -0.5030,  0.7968],
        [ 0.9561,  0.9552, -0.8819, -0.9708, -0.8013, -0.2991],
        [ 0.9960, -0.5333,  0.9778, -0.9786, -0.9792, -0.9674],
        [ 0.9745,  0.5894, -0.9335,  0.4329, -0.9733, -0.9855],
        [-0.9978, -0.8234, -0.9140,  0.8564,  0.9558,  0.9575],
        [-0.9859, -0.9901, -0.9770, -0.9093,  0.9713,  0.9406],
        [ 0.5983,  0.9517, -0.9855,  0.2282,  0.1432,  0.0212],
        [ 0.9955,  0.1215,  0.9836,  0.4331, -0.8376, -0.0756],
        [ 0.9849,  0.6032,  0.8110,  0.0694, -0.9794,  0.0328],
        [ 0.9724, -0.3209, -0.8817,  0.9013, -0.9569,  0.3430],
        [-0.9842, -0.9882, -0.9483,  0.7772,  0.9523,  0.4540],
        [-0.9813, -0.9930, -0.9113, -0.3332,  0.9813,  0.9467],
        [ 0.9263,  0.9043, -0.9289, -0.5980,  0.1964,  0.0872]],
       device='cuda:0')
squash tensor([[ 1.6557,  0.1213,  0.9008,  0.3380, -2.5957, -1.2307],
        [ 2.9302,  0.1237, -2.1726,  2.3442, -0.6824,  1.5202],
        [-2.5071, -2.6296, -2.2772,  3.0313,  2.3077,  0.8976],
        [-2.3120, -2.8209, -1.4743,  0.1706,  1.3376,  0.6331],
        [ 1.3252, -0.0971, -1.4669, -0.4984,  1.3925,  0.9279],
        [ 2.2016,  0.3361,  2.3664,  0.4770, -0.1723,  1.3393],
        [-1.3390, -0.0249, -1.2461,  0.4404,  0.1940, -0.2803],
        [-2.4706,  2.5930, -1.1585, -1.4761, -0.5534,  1.0899],
        [ 1.8988,  1.8882, -1.3844, -2.1069, -1.1023, -0.3085],
        [ 3.1122, -0.5948,  2.2444, -2.2628, -2.2770, -2.0507],
        [ 2.1744,  0.6767, -1.6847,  0.4634, -2.1512, -2.4609],
        [-3.4159, -1.1673, -1.5514,  1.2795,  1.8949,  1.9150],
        [-2.4751, -2.6511, -2.2264, -1.5232,  2.1151,  1.7436],
        [ 0.6905,  1.8491, -2.4601,  0.2323,  0.1442,  0.0212],
        [ 3.0492,  0.1221,  2.3967,  0.4637, -1.2132, -0.0757],
        [ 2.4392,  0.6982,  1.1299,  0.0695, -2.2838,  0.0328],
        [ 2.1351, -0.3327, -1.3834,  1.4790, -1.9077,  0.3575],
        [-2.4177, -2.5644, -1.8142,  1.0383,  1.8558,  0.4897],
        [-2.3302, -2.8245, -1.5353, -0.3464,  2.3320,  1.7992],
        [ 1.6317,  1.4955, -1.6504, -0.6900,  0.1990,  0.0874]],
       device='cuda:0')
action: tensor([[ 0.8144,  0.9250,  0.3439, -0.2147, -0.9041, -0.4941],
        [-0.1347, -0.4550,  0.4037,  0.7019,  0.6502,  0.6324],
        [ 0.9145,  0.7554, -0.8688, -0.2483, -0.9455, -0.8040],
        [-0.6407,  0.3619, -0.9807,  0.0837, -0.7818, -0.7528],
        [-0.8881, -0.6199, -0.9686, -0.3429, -0.5244, -0.6649],
        [ 0.4526,  0.9512, -0.6488, -0.7088,  0.1913,  0.3969],
        [ 0.9588, -0.3100,  0.9630, -0.9236, -0.4719, -0.6784],
        [ 0.1754, -0.2955,  0.9468, -0.9779,  0.3418,  0.1684],
        [ 0.9823,  0.4107,  0.9433, -0.8697,  0.4558, -0.5885],
        [ 0.9400,  0.6905,  0.4034, -0.7378,  0.1145, -0.2294],
        [ 0.9846,  0.6103,  0.9440, -0.7487, -0.1783, -0.4982],
        [ 0.9773,  0.2968, -0.1756, -0.3893, -0.9352, -0.7808],
        [ 0.9841,  0.2132,  0.2550, -0.5016, -0.9163, -0.9476],
        [ 0.9400, -0.7794, -0.2961, -0.0969, -0.9053, -0.9470],
        [-0.9113, -0.9642, -0.9434,  0.5990, -0.1287, -0.9523],
        [-0.9746, -0.9847, -0.9580, -0.4221,  0.9950,  0.4863],
        [-0.2317,  0.1447, -0.9614, -0.9933,  0.9085, -0.1932],
        [ 0.9771,  0.9712,  0.4833, -0.1561, -0.9698, -0.8595],
        [ 0.9655,  0.5245,  0.9380,  0.6209, -0.9963, -0.6736],
        [ 0.9929, -0.3211, -0.9838,  0.9703, -0.3981,  0.5258]],
       device='cuda:0')
squash tensor([[ 1.1401,  1.6224,  0.3586, -0.2181, -1.4944, -0.5415],
        [-0.1355, -0.4909,  0.4281,  0.8709,  0.7756,  0.7454],
        [ 1.5541,  0.9853, -1.3282, -0.2536, -1.7871, -1.1097],
        [-0.7594,  0.3791, -2.3147,  0.0839, -1.0499, -0.9793],
        [-1.4127, -0.7249, -2.0692, -0.3574, -0.5824, -0.8016],
        [ 0.4879,  1.8437, -0.7732, -0.8848,  0.1937,  0.4200],
        [ 1.9312, -0.3205,  1.9853, -1.6131, -0.5125, -0.8262],
        [ 0.1772, -0.3046,  1.8004, -2.2481,  0.3562,  0.1701],
        [ 2.3603,  0.4364,  1.7674, -1.3319,  0.4920, -0.6753],
        [ 1.7378,  0.8490,  0.4277, -0.9456,  0.1150, -0.2336],
        [ 2.4308,  0.7093,  1.7738, -0.9700, -0.1802, -0.5469],
        [ 2.2342,  0.3060, -0.1775, -0.4110, -1.6985, -1.0474],
        [ 2.4127,  0.2165,  0.2607, -0.5515, -1.5657, -1.8073],
        [ 1.7383, -1.0437, -0.3053, -0.0972, -1.5007, -1.8017],
        [-1.5350, -2.0026, -1.7677,  0.6916, -0.1294, -1.8554],
        [-2.1760, -2.4317, -1.9211, -0.4502,  2.9985,  0.5312],
        [-0.2360,  0.1457, -1.9639, -2.8451,  1.5190, -0.1957],
        [ 2.2282,  2.1132,  0.5273, -0.1574, -2.0897, -1.2914],
        [ 2.0207,  0.5825,  1.7212,  0.7264, -3.1444, -0.8173],
        [ 2.8153, -0.3329, -2.4025,  2.0976, -0.4213,  0.5844]],
       device='cuda:0')
action: tensor([[-0.9752, -0.9852, -0.8464,  0.9357,  0.9936,  0.9614],
        [-0.9840, -0.9290, -0.9606, -0.1524,  0.8082,  0.5341],
        [ 0.7076,  0.1019, -0.1849, -0.1415,  0.3826,  0.2914],
        [ 0.8206,  0.3842,  0.8461,  0.4763, -0.7471, -0.3946],
        [-0.3705,  0.0039,  0.1234,  0.8210, -0.5435,  0.5389],
        [-0.7525,  0.8408, -0.9454, -0.1977, -0.6885,  0.8424],
        [ 0.8435,  0.7638, -0.9522, -0.9496, -0.3258, -0.2921],
        [ 0.9959, -0.9559,  0.9653, -0.8288, -0.9585, -0.9729],
        [ 0.9969, -0.9743, -0.9748,  0.8019, -0.9711, -0.8932],
        [-0.9898, -0.9662, -0.9340,  0.7498,  0.9857,  0.9846],
        [-0.9937, -0.9986, -0.9769, -0.8852,  0.9774,  0.9009],
        [ 0.9472, -0.2746, -0.0905,  0.7795,  0.9573,  0.1251],
        [ 0.9623,  0.5769,  0.9843,  0.5929, -0.9516, -0.7373],
        [ 0.9961,  0.2231,  0.8786,  0.8291, -0.9648, -0.2960],
        [ 0.9940, -0.0670, -0.9598,  0.9928, -0.9824,  0.5689],
        [-0.9885, -0.8096, -0.9434,  0.9809,  0.9890,  0.9584],
        [-0.9450, -0.9431, -0.9669,  0.1538,  0.8974,  0.1173],
        [ 0.6860, -0.2907, -0.7216, -0.7499,  0.5881,  0.7986],
        [ 0.9883,  0.2944,  0.9981,  0.4598, -0.5399,  0.3101],
        [-0.8311, -0.6573, -0.9520,  0.8054,  0.8065,  0.9424]],
       device='cuda:0')
squash tensor([[-2.1894, -2.4497, -1.2432,  1.7022,  2.8690,  1.9639],
        [-2.4101, -1.6513, -1.9539, -0.1536,  1.1218,  0.5959],
        [ 0.8824,  0.1022, -0.1871, -0.1424,  0.4031,  0.3001],
        [ 1.1586,  0.4050,  1.2422,  0.5182, -0.9663, -0.4172],
        [-0.3889,  0.0039,  0.1240,  1.1599, -0.6091,  0.6026],
        [-0.9787,  1.2238, -1.7862, -0.2003, -0.8452,  1.2294],
        [ 1.2333,  1.0053, -1.8548, -1.8279, -0.3381, -0.3009],
        [ 3.0908, -1.8958,  2.0187, -1.1844, -1.9275, -2.1444],
        [ 3.2366, -2.1699, -2.1801,  1.1039, -2.1120, -1.4375],
        [-2.6381, -2.0321, -1.6888,  0.9725,  2.4653,  2.4295],
        [-2.8807, -3.6282, -2.2249, -1.3995,  2.2352,  1.4770],
        [ 1.8040, -0.2819, -0.0907,  1.0440,  1.9129,  0.1258],
        [ 1.9756,  0.6578,  2.4204,  0.6821, -1.8482, -0.9446],
        [ 3.1127,  0.2269,  1.3695,  1.1852, -2.0112, -0.3051],
        [ 2.9053, -0.0671, -1.9435,  2.8084, -2.3630,  0.6459],
        [-2.5763, -1.1260, -1.7685,  2.3212,  2.6006,  1.9254],
        [-1.7831, -1.7651, -2.0418,  0.1550,  1.4586,  0.1178],
        [ 0.8403, -0.2993, -0.9110, -0.9726,  0.6747,  1.0948],
        [ 2.5657,  0.3034,  3.4759,  0.4970, -0.6040,  0.3207],
        [-1.1915, -0.7881, -1.8525,  1.1137,  1.1169,  1.7589]],
       device='cuda:0')
action: tensor([[ 0.8655,  0.2071,  0.9394,  0.0301, -0.8409, -0.4815],
        [ 0.8997, -0.7074,  0.9967,  0.8703, -0.7221, -0.5427],
        [ 0.9854,  0.5943,  0.9602,  0.6196, -0.8064, -0.8403],
        [ 0.9754, -0.2246, -0.8843,  0.4101, -0.9578, -0.8512],
        [-0.9508, -0.9355, -0.9300,  0.4998,  0.8514, -0.9397],
        [-0.9643, -0.9686, -0.9176, -0.6815,  0.9880,  0.9588],
        [ 0.8048,  0.9237, -0.9025, -0.8836,  0.1395, -0.0659],
        [ 0.9626, -0.1119,  0.9620,  0.3219, -0.7025, -0.8963],
        [ 0.9152,  0.4599,  0.9355,  0.4715, -0.9104, -0.1163],
        [ 0.8843, -0.9485, -0.9164,  0.9772, -0.9131, -0.9647],
        [-0.9265, -0.8918, -0.9728,  0.6730,  0.9347, -0.3471],
        [-0.9387, -0.9402, -0.9864, -0.7000,  0.9840,  0.5417],
        [-0.5878,  0.9787, -0.9154, -0.8364,  0.1767, -0.7575],
        [ 0.9713, -0.0146,  0.9908,  0.2727, -0.5651,  0.3238],
        [ 0.9977, -0.1083,  0.9014,  0.9605, -0.7270, -0.5397],
        [ 0.9895, -0.9857, -0.9937,  0.9961, -0.7856, -0.9262],
        [-0.9832, -0.9122, -0.9839,  0.7878,  0.9639, -0.8400],
        [-0.9317, -0.9275, -0.9881, -0.7390,  0.9650,  0.8861],
        [ 0.0203,  0.9924, -0.9840, -0.8488, -0.8564,  0.7591],
        [ 0.9627,  0.9857,  0.2799,  0.1885, -0.9568,  0.6227]],
       device='cuda:0')
squash tensor([[ 1.3148,  0.2102,  1.7328,  0.0301, -1.2241, -0.5249],
        [ 1.4706, -0.8819,  3.2069,  1.3344, -0.9121, -0.6080],
        [ 2.4578,  0.6843,  1.9485,  0.7244, -1.1165, -1.2222],
        [ 2.1932, -0.2285, -1.3950,  0.4357, -1.9185, -1.2606],
        [-1.8400, -1.7010, -1.6582,  0.5490,  1.2614, -1.7358],
        [-2.0040, -2.0688, -1.5737, -0.8320,  2.5545,  1.9308],
        [ 1.1122,  1.6137, -1.4855, -1.3919,  0.1405, -0.0660],
        [ 1.9803, -0.1123,  1.9720,  0.3337, -0.8721, -1.4531],
        [ 1.5585,  0.4971,  1.7005,  0.5120, -1.5300, -0.1168],
        [ 1.3954, -1.8162, -1.5661,  2.2323, -1.5460, -2.0098],
        [-1.6327, -1.4308, -2.1414,  0.8162,  1.6947, -0.3622],
        [-1.7272, -1.7395, -2.4907, -0.8674,  2.4106,  0.6066],
        [-0.6743,  2.2666, -1.5601, -1.2090,  0.1786, -0.9903],
        [ 2.1152, -0.0146,  2.6898,  0.2798, -0.6403,  0.3358],
        [ 3.3775, -0.1088,  1.4796,  1.9517, -0.9223, -0.6037],
        [ 2.6223, -2.4654, -2.8769,  3.1140, -1.0599, -1.6308],
        [-2.3859, -1.5403, -2.4083,  1.0657,  1.9982, -1.2213],
        [-1.6713, -1.6401, -2.5599, -0.9483,  2.0145,  1.4034],
        [ 0.0203,  2.7825, -2.4100, -1.2517, -1.2796,  0.9942],
        [ 1.9822,  2.4671,  0.2876,  0.1908, -1.9064,  0.7294]],
       device='cuda:0')
action: tensor([[ 0.9688,  0.6980,  0.8546,  0.6829, -0.8536, -0.8779],
        [ 0.9520, -0.0514, -0.4203,  0.4926, -0.9755, -0.8058],
        [-0.8431, -0.9883, -0.8952,  0.3754,  0.9657,  0.2051],
        [-0.9791, -0.9762, -0.9693, -0.6477,  0.9232,  0.9207],
        [ 0.5683,  0.9190, -0.9164, -0.0984,  0.6535,  0.5066],
        [ 0.9964, -0.4971,  0.9897,  0.3318, -0.9248, -0.4479],
        [ 0.9903,  0.3927,  0.9659,  0.4276, -0.9313, -0.9264],
        [ 0.9707,  0.0195, -0.9264,  0.9466, -0.9274, -0.7914],
        [-0.9941, -0.9909, -0.9572,  0.9194,  0.9889,  0.6637],
        [-0.9659, -0.9415, -0.9702, -0.7251,  0.9250,  0.6047],
        [ 0.9101,  0.4862, -0.9441, -0.1364,  0.1203, -0.2409],
        [ 0.9816,  0.0438,  0.9822,  0.3198, -0.7899, -0.4859],
        [ 0.9904, -0.3540,  0.9632,  0.5455, -0.8294, -0.6279],
        [ 0.9756,  0.4006, -0.5726,  0.8276, -0.9031, -0.5586],
        [-0.9880, -0.9580, -0.9860,  0.5610,  0.9777, -0.2768],
        [-0.9696, -0.9506, -0.9143, -0.2997,  0.9729,  0.8024],
        [ 0.9393,  0.9691, -0.8571, -0.9292, -0.0435,  0.3645],
        [ 0.9854,  0.0600,  0.9621,  0.0994, -0.6923, -0.3548],
        [ 0.9953,  0.4207,  0.9895,  0.2810, -0.8523,  0.2596],
        [ 0.9910,  0.0033, -0.2741,  0.4881, -0.9225, -0.8933]],
       device='cuda:0')
squash tensor([[ 2.0731,  0.8633,  1.2730,  0.8345, -1.2692, -1.3665],
        [ 1.8528, -0.0515, -0.4480,  0.5395, -2.1946, -1.1148],
        [-1.2320, -2.5664, -1.4473,  0.3947,  2.0240,  0.2080],
        [-2.2747, -2.2102, -2.0807, -0.7714,  1.6102,  1.5936],
        [ 0.6450,  1.5828, -1.5661, -0.0987,  0.7813,  0.5581],
        [ 3.1601, -0.5454,  2.6304,  0.3448, -1.6209, -0.4820],
        [ 2.6644,  0.4149,  2.0266,  0.4570, -1.6681, -1.6324],
        [ 2.1051,  0.0195, -1.6321,  1.7980, -1.6398, -1.0752],
        [-2.9101, -2.6939, -1.9116,  1.5849,  2.5947,  0.7994],
        [-2.0266, -1.7512, -2.0958, -0.9183,  1.6227,  0.7005],
        [ 1.5279,  0.5311, -1.7741, -0.1372,  0.1209, -0.2457],
        [ 2.3392,  0.0438,  2.3553,  0.3315, -1.0712, -0.5306],
        [ 2.6693, -0.3700,  1.9879,  0.6120, -1.1862, -0.7379],
        [ 2.1969,  0.4244, -0.6514,  1.1806, -1.4886, -0.6308],
        [-2.5538, -1.9207, -2.4767,  0.6343,  2.2424, -0.2842],
        [-2.0860, -1.8379, -1.5530, -0.3091,  2.1438,  1.1053],
        [ 1.7317,  2.0773, -1.2821, -1.6525, -0.0435,  0.3821],
        [ 2.4555,  0.0601,  1.9729,  0.0997, -0.8524, -0.3709],
        [ 3.0306,  0.4485,  2.6227,  0.2888, -1.2644,  0.2656],
        [ 2.6970,  0.0033, -0.2813,  0.5335, -1.6056, -1.4381]],
       device='cuda:0')
action: tensor([[ 0.7549,  0.8535, -0.7606, -0.9267,  0.1001, -0.0574],
        [ 0.9805, -0.8312,  0.9368, -0.9349, -0.8773, -0.8877],
        [ 0.9920,  0.5868, -0.9364,  0.3248, -0.9314, -0.5402],
        [-0.9750, -0.9718, -0.9930,  0.4752,  0.9748,  0.5923],
        [-0.9534, -0.9921, -0.9813, -0.4747,  0.9632,  0.6002],
        [ 0.7453,  0.6486, -0.9178,  0.0949,  0.7458, -0.0208],
        [ 0.9841, -0.4084,  0.9964,  0.1008, -0.9512,  0.2754],
        [ 0.9949, -0.2574,  0.9836,  0.3181, -0.7496, -0.1002],
        [ 0.9789,  0.0152,  0.8326,  0.8163, -0.9803, -0.5118],
        [ 0.9242, -0.6445, -0.0742,  0.5414, -0.9582, -0.9691],
        [-0.9873, -0.9776, -0.9689,  0.5091,  0.9888,  0.6504],
        [-0.8417, -0.9938, -0.9548, -0.6051,  0.9768,  0.7093],
        [ 0.8070,  0.5420, -0.3381, -0.0074,  0.6544,  0.4025],
        [ 0.9962, -0.1386,  0.9936,  0.5201, -0.9843, -0.8350],
        [ 0.9964,  0.7599,  0.9920,  0.0213, -0.9516,  0.2423],
        [ 0.9812, -0.2226, -0.8897,  0.8148, -0.9810, -0.7696],
        [-0.9861, -0.9184, -0.9504,  0.9194,  0.9798,  0.9447],
        [-0.9717, -0.9475, -0.9574, -0.3551,  0.9215,  0.7738],
        [ 0.8980, -0.2182, -0.7158,  0.0341,  0.8972,  0.3813],
        [ 0.9492,  0.3129,  0.9202,  0.3559, -0.7745, -0.8005]],
       device='cuda:0')
squash tensor([[ 0.9842,  1.2689, -0.9977, -1.6348,  0.1004, -0.0574],
        [ 2.3107, -1.1921,  1.7109, -1.6956, -1.3638, -1.4110],
        [ 2.7592,  0.6728, -1.7082,  0.3370, -1.6685, -0.6045],
        [-2.1853, -2.1245, -2.8278,  0.5168,  2.1817,  0.6813],
        [-1.8681, -2.7649, -2.3315, -0.5161,  1.9887,  0.6935],
        [ 0.9623,  0.7728, -1.5748,  0.0952,  0.9635, -0.0208],
        [ 2.4142, -0.4337,  3.1584,  0.1012, -1.8443,  0.2827],
        [ 2.9801, -0.2634,  2.3977,  0.3295, -0.9721, -0.1006],
        [ 2.2699,  0.0152,  1.1965,  1.1457, -2.3057, -0.5652],
        [ 1.6172, -0.7658, -0.0743,  0.6062, -1.9230, -2.0775],
        [-2.5272, -2.2408, -2.0733,  0.5615,  2.5906,  0.7760],
        [-1.2268, -2.8839, -1.8836, -0.7011,  2.2227,  0.8858],
        [ 1.1185,  0.6069, -0.3519, -0.0074,  0.7829,  0.4266],
        [ 3.1267, -0.1395,  2.8693,  0.5765, -2.4204, -1.2044],
        [ 3.1529,  0.9961,  2.7573,  0.0214, -1.8480,  0.2472],
        [ 2.3286, -0.2264, -1.4206,  1.1412, -2.3230, -1.0193],
        [-2.4817, -1.5788, -1.8363,  1.5851,  2.2929,  1.7800],
        [-2.1214, -1.8064, -1.9133, -0.3712,  1.5990,  1.0298],
        [ 1.4620, -0.2217, -0.8990,  0.0341,  1.4577,  0.4015],
        [ 1.8233,  0.3238,  1.5905,  0.3722, -1.0315, -1.1000]],
       device='cuda:0')
action: tensor([[ 0.1209,  0.9465, -0.9398, -0.4860,  0.3257, -0.1430],
        [ 0.9678, -0.1578,  0.9611,  0.5601, -0.3469,  0.0642],
        [ 0.9909,  0.5847,  0.9897, -0.1543, -0.9450, -0.9111],
        [ 0.7152,  0.8431,  0.7752, -0.0288, -0.8692, -0.7966],
        [ 0.9340,  0.3104, -0.9336, -0.0945, -0.9682, -0.8740],
        [-0.8094, -0.9729, -0.9656,  0.3164,  0.9262,  0.1751],
        [-0.9691, -0.9694, -0.8810, -0.4982,  0.9878,  0.8825],
        [ 0.9240,  0.6502, -0.9622, -0.7284,  0.8327, -0.1493],
        [ 0.9729,  0.6670,  0.9620,  0.3888, -0.8288,  0.1225],
        [-0.9927,  0.9330, -0.9096, -0.5810, -0.1566,  0.5384],
        [ 0.8471,  0.9491, -0.8509, -0.8128,  0.3875, -0.3965],
        [ 0.9769, -0.8060,  0.9519, -0.9477, -0.8903, -0.9222],
        [ 0.9707,  0.8030, -0.9862,  0.0095, -0.9655, -0.9072],
        [-0.9895, -0.7450, -0.7579,  0.8672,  0.9848,  0.9563],
        [-0.9962, -0.9834, -0.9652, -0.8443,  0.9875,  0.9785],
        [ 0.9739, -0.1153,  0.0681,  0.9203,  0.8639,  0.7093],
        [ 0.9924, -0.0540,  0.9175,  0.8448, -0.9759, -0.9600],
        [ 0.9828, -0.1411,  0.9568,  0.9026, -0.9383, -0.7315],
        [ 0.8329, -0.8373, -0.9807,  0.9863, -0.9184,  0.6703],
        [-0.9812, -0.6678, -0.9826,  0.9958,  0.9600,  0.9225]],
       device='cuda:0')
squash tensor([[ 0.1215,  1.7968, -1.7361, -0.5308,  0.3380, -0.1440],
        [ 2.0564, -0.1591,  1.9598,  0.6330, -0.3619,  0.0643],
        [ 2.6923,  0.6695,  2.6309, -0.1555, -1.7830, -1.5339],
        [ 0.8977,  1.2318,  1.0332, -0.0288, -1.3299, -1.0891],
        [ 1.6891,  0.3210, -1.6860, -0.0947, -2.0622, -1.3496],
        [-1.1251, -2.1446, -2.0221,  0.3277,  1.6307,  0.1769],
        [-2.0781, -2.0824, -1.3801, -0.5470,  2.5454,  1.3871],
        [ 1.6155,  0.7757, -1.9749, -0.9252,  1.1969, -0.1504],
        [ 2.1430,  0.8052,  1.9725,  0.4104, -1.1844,  0.1232],
        [-2.8036,  1.6810, -1.5252, -0.6639, -0.1579,  0.6019],
        [ 1.2458,  1.8227, -1.2593, -1.1351,  0.4088, -0.4195],
        [ 2.2245, -1.1156,  1.8517, -1.8083, -1.4234, -1.6036],
        [ 2.1036,  1.1069, -2.4836,  0.0095, -2.0218, -1.5115],
        [-2.6220, -0.9616, -0.9912,  1.3215,  2.4371,  1.9007],
        [-3.1350, -2.3906, -2.0165, -1.2358,  2.5325,  2.2616],
        [ 2.1632, -0.1159,  0.0682,  1.5913,  1.3083,  0.8858],
        [ 2.7816, -0.0541,  1.5728,  1.2378, -2.2031, -1.9465],
        [ 2.3737, -0.1421,  1.9067,  1.4862, -1.7238, -0.9319],
        [ 1.1975, -1.2120, -2.3148,  2.4872, -1.5785,  0.8112],
        [-2.3291, -0.8068, -2.3688,  3.0817,  1.9458,  1.6055]],
       device='cuda:0')
action: tensor([[-0.9919, -0.9463, -0.9848,  0.6456,  0.9665,  0.9546],
        [-0.9738, -0.9859, -0.9609, -0.9572,  0.8496,  0.9602],
        [ 0.5750,  0.7032, -0.9122,  0.5178,  0.5162,  0.2031],
        [ 0.9634, -0.1340,  0.9825,  0.6364, -0.9702, -0.9665],
        [ 0.9962,  0.7486,  0.8887,  0.3139, -0.9672, -0.9176],
        [ 0.9727,  0.1512, -0.8636,  0.9836, -0.9658,  0.7844],
        [-0.9403, -0.8620, -0.9701,  0.9417,  0.9964,  0.9672],
        [-0.9880, -0.9628, -0.9907,  0.2749,  0.8663,  0.5923],
        [ 0.7424,  0.2432, -0.7812, -0.4099,  0.5460, -0.2866],
        [ 0.9859, -0.6676,  0.9952,  0.9528,  0.0604, -0.2424],
        [-0.9061, -0.1348,  0.4284, -0.1944,  0.7069,  0.8689],
        [ 0.8688,  0.3820,  0.9363, -0.0741,  0.3421, -0.8516],
        [ 0.9937, -0.2573,  0.3753, -0.4461, -0.3278, -0.2841],
        [ 0.9964,  0.5234,  0.3608, -0.1832, -0.9873, -0.9915],
        [ 0.9832, -0.4197, -0.2937, -0.2283, -0.8990, -0.9920],
        [-0.8915, -0.9794, -0.7264,  0.4371,  0.4644, -0.9506],
        [-0.9797, -0.9967, -0.8158, -0.7515,  0.9972, -0.0630],
        [-0.7565, -0.0565, -0.9461, -0.7954,  0.9633,  0.7671],
        [ 0.9564,  0.8750,  0.9731, -0.5153, -0.6835, -0.2853],
        [ 0.9881, -0.6861,  0.2068, -0.4500, -0.6795, -0.1787]],
       device='cuda:0')
squash tensor([[-2.7513, -1.7950, -2.4355,  0.7678,  2.0356,  1.8816],
        [-2.1611, -2.4733, -1.9579, -1.9113,  1.2547,  1.9483],
        [ 0.6550,  0.8736, -1.5405,  0.5733,  0.5711,  0.2060],
        [ 1.9916, -0.1349,  2.3648,  0.7521, -2.0954, -2.0365],
        [ 3.1361,  0.9698,  1.4156,  0.3249, -2.0475, -1.5738],
        [ 2.1406,  0.1524, -1.3075,  2.3966, -2.0263,  1.0568],
        [-1.7406, -1.3013, -2.0948,  1.7525,  3.1611,  2.0469],
        [-2.5570, -1.9834, -2.6857,  0.2822,  1.3182,  0.6812],
        [ 0.9558,  0.2482, -1.0484, -0.4355,  0.6127, -0.2949],
        [ 2.4725, -0.8064,  3.0101,  1.8610,  0.0605, -0.2473],
        [-1.5052, -0.1356,  0.4579, -0.1969,  0.8809,  1.3286],
        [ 1.3281,  0.4024,  1.7071, -0.0742,  0.3565, -1.2620],
        [ 2.8816, -0.2633,  0.3945, -0.4798, -0.3403, -0.2921],
        [ 3.1598,  0.5810,  0.3778, -0.1853, -2.5282, -2.7254],
        [ 2.3844, -0.4473, -0.3026, -0.2324, -1.4668, -2.7593],
        [-1.4292, -2.2836, -0.9211,  0.4686,  0.5029, -1.8377],
        [-2.2906, -3.2075, -1.1441, -0.9764,  3.2786, -0.0631],
        [-0.9880, -0.0566, -1.7928, -1.0860,  1.9900,  1.0132],
        [ 1.9016,  1.3542,  2.1486, -0.5699, -0.8356, -0.2935],
        [ 2.5598, -0.8405,  0.2098, -0.4847, -0.8282, -0.1806]],
       device='cuda:0')
action: tensor([[-0.9434, -0.9930, -0.9443, -0.6604,  0.9546,  0.6459],
        [ 0.8321,  0.9480, -0.9581, -0.7399,  0.2866,  0.3276],
        [ 0.9885, -0.0613,  0.9635,  0.2759, -0.5037, -0.0282],
        [ 0.9772,  0.1925,  0.7648, -0.0413, -0.8491, -0.9091],
        [ 0.8990,  0.6731,  0.7789,  0.1412, -0.9019, -0.9561],
        [ 0.9394,  0.4843, -0.5081,  0.1964, -0.9198, -0.9716],
        [-0.9668, -0.9236, -0.9530,  0.4256,  0.4933, -0.7181],
        [-0.8800, -0.9418, -0.8451, -0.6693,  0.9844,  0.8875],
        [ 0.3412,  0.7386, -0.9274, -0.7936, -0.5067, -0.1949],
        [ 0.9940, -0.0957,  0.9928,  0.5150, -0.9254, -0.5406],
        [ 0.9787,  0.0986,  0.9961,  0.2478, -0.8995, -0.9816],
        [ 0.6115, -0.4162, -0.3388,  0.9480, -0.9790, -0.7580],
        [-0.9716, -0.9078, -0.8568,  0.4977,  0.9059,  0.4785],
        [-0.9719, -0.9430, -0.9637, -0.5178,  0.8869,  0.6049],
        [ 0.3440,  0.6867, -0.8089, -0.4654,  0.3898, -0.2637],
        [ 0.9370, -0.3652,  0.9920,  0.4232, -0.7597,  0.4908],
        [ 0.9931, -0.1426,  0.9598,  0.5319, -0.8954, -0.7116],
        [ 0.9863, -0.6327, -0.1263,  0.8978, -0.4152, -0.8888],
        [-0.9758, -0.9928, -0.7916,  0.4419,  0.9641, -0.7726],
        [-0.9427, -0.9608, -0.9554, -0.6984,  0.9600,  0.4972]],
       device='cuda:0')
squash tensor([[-1.7681, -2.8289, -1.7767, -0.7935,  1.8810,  0.7682],
        [ 1.1949,  1.8116, -1.9227, -0.9502,  0.2949,  0.3402],
        [ 2.5772, -0.0614,  1.9933,  0.2832, -0.5543, -0.0282],
        [ 2.2319,  0.1950,  1.0076, -0.0413, -1.2529, -1.5223],
        [ 1.4672,  0.8164,  1.0427,  0.1422, -1.4823, -1.8979],
        [ 1.7330,  0.5285, -0.5602,  0.1989, -1.5874, -2.1204],
        [-2.0406, -1.6127, -1.8638,  0.4545,  0.5405, -0.9037],
        [-1.3756, -1.7541, -1.2389, -0.8095,  2.4216,  1.4102],
        [ 0.3554,  0.9474, -1.6393, -1.0810, -0.5583, -0.1974],
        [ 2.9060, -0.0959,  2.8143,  0.5694, -1.6256, -0.6050],
        [ 2.2665,  0.0989,  3.1132,  0.2531, -1.4697, -2.3390],
        [ 0.7113, -0.4431, -0.3528,  1.8114, -2.2729, -0.9915],
        [-2.1198, -1.5151, -1.2813,  0.5462,  1.5043,  0.5210],
        [-2.1259, -1.7647, -1.9952, -0.5733,  1.4072,  0.7009],
        [ 0.3586,  0.8417, -1.1239, -0.5042,  0.4116, -0.2700],
        [ 1.7125, -0.3828,  2.7590,  0.4516, -0.9956,  0.5372],
        [ 2.8297, -0.1436,  1.9432,  0.5928, -1.4483, -0.8905],
        [ 2.4888, -0.7459, -0.1270,  1.4610, -0.4418, -1.4161],
        [-2.2021, -2.8141, -1.0758,  0.4746,  2.0017, -1.0267],
        [-1.7614, -1.9562, -1.8899, -0.8642,  1.9454,  0.5456]],
       device='cuda:0')
action: tensor([[ 0.9955,  0.6066,  0.9927,  0.1818, -0.1527,  0.4137],
        [-0.9119, -0.3705, -0.8355,  0.3997, -0.1743,  0.6879],
        [-0.9720,  0.9702, -0.9732, -0.8195, -0.3827,  0.8096],
        [ 0.8926,  0.9539, -0.9198, -0.9198, -0.5424, -0.9894],
        [ 0.9683, -0.9558,  0.9828, -0.9814, -0.9686, -0.9590],
        [ 0.9994,  0.3406, -0.6621,  0.6859, -0.9878, -0.9587],
        [-0.9872, -0.9846, -0.9873,  0.6642,  0.9945,  0.8834],
        [-0.9930, -0.9666, -0.9432, -0.9842,  0.9713,  0.9466],
        [ 0.4031,  0.9417, -0.9659,  0.2936, -0.1383,  0.7515],
        [ 0.9821,  0.4555,  0.9744,  0.5144, -0.9175, -0.5780],
        [ 0.9898,  0.4980,  0.9855,  0.1980, -0.9548, -0.0971],
        [ 0.9933,  0.4837, -0.8011,  0.8222, -0.7627, -0.9655],
        [-0.9638, -0.9673, -0.9204,  0.5971,  0.9633,  0.7973],
        [-0.9459, -0.9459, -0.9792, -0.0452,  0.8961,  0.6536],
        [ 0.7668,  0.4749, -0.9028, -0.7351,  0.4617,  0.3211],
        [ 0.9829, -0.1027,  0.9807,  0.3935,  0.0193,  0.1693],
        [ 0.9913,  0.2967,  0.9535, -0.4128, -0.9444, -0.5049],
        [ 0.9846,  0.4674,  0.8744,  0.2868, -0.8843, -0.9785],
        [ 0.9576,  0.1976, -0.6094,  0.1141, -0.8593, -0.9391],
        [-0.9877, -0.9297, -0.8514,  0.0477,  0.8981, -0.6493]],
       device='cuda:0')
squash tensor([[ 3.0458,  0.7036,  2.8036,  0.1839, -0.1539,  0.4400],
        [-1.5388, -0.3890, -1.2061,  0.4233, -0.1761,  0.8440],
        [-2.1275,  2.0960, -2.1499, -1.1553, -0.4032,  1.1259],
        [ 1.4345,  1.8733, -1.5877, -1.5877, -0.6075, -2.6174],
        [ 2.0649, -1.8954,  2.3747, -2.3341, -2.0687, -1.9337],
        [ 4.0803,  0.3548, -0.7965,  0.8401, -2.5471, -1.9292],
        [-2.5216, -2.4284, -2.5277,  0.8002,  2.9434,  1.3911],
        [-2.8231, -2.0378, -1.7664, -2.4174,  2.1140,  1.7984],
        [ 0.4274,  1.7528, -2.0271,  0.3025, -0.1392,  0.9763],
        [ 2.3529,  0.4916,  2.1731,  0.5687, -1.5731, -0.6595],
        [ 2.6390,  0.5466,  2.4611,  0.2007, -1.8830, -0.0974],
        [ 2.8490,  0.5277, -1.1016,  1.1635, -1.0026, -2.0214],
        [-1.9966, -2.0486, -1.5916,  0.6887,  1.9903,  1.0912],
        [-1.7913, -1.7911, -2.2784, -0.0452,  1.4522,  0.7815],
        [ 1.0125,  0.5164, -1.4872, -0.9398,  0.4995,  0.3329],
        [ 2.3755, -0.1031,  2.3167,  0.4160,  0.0193,  0.1709],
        [ 2.7166,  0.3059,  1.8693, -0.4390, -1.7770, -0.5558],
        [ 2.4292,  0.5067,  1.3515,  0.2951, -1.3954, -2.2601],
        [ 1.9165,  0.2003, -0.7079,  0.1146, -1.2907, -1.7305],
        [-2.5440, -1.6563, -1.2611,  0.0477,  1.4623, -0.7740]],
       device='cuda:0')
action: tensor([[ 9.9293e-01,  4.2115e-01,  9.8707e-01, -5.2251e-02, -9.4562e-01,
         -4.1157e-01],
        [ 9.7660e-01, -7.8642e-03,  9.7992e-01,  4.3281e-01, -8.6569e-01,
         -3.1923e-01],
        [ 9.8011e-01,  3.4889e-01,  9.1248e-01,  5.6171e-01, -9.5644e-01,
         -9.7528e-01],
        [ 8.3405e-01, -9.0921e-02, -9.1471e-01,  5.8574e-01, -9.7863e-01,
         -7.1094e-01],
        [-9.7498e-01, -9.6866e-01, -9.0456e-01,  5.3834e-01,  8.9961e-01,
          3.4751e-02],
        [-8.8711e-01, -9.9398e-01, -9.9024e-01, -7.7421e-01,  9.4740e-01,
          5.9481e-01],
        [ 8.6758e-01,  8.5574e-01, -7.0343e-01, -4.2705e-01,  8.2506e-01,
         -4.2635e-03],
        [ 9.7158e-01, -3.5515e-01,  9.8306e-01,  5.6347e-01, -8.8454e-01,
          9.2959e-02],
        [ 9.6704e-01,  1.5214e-01,  9.7116e-01,  6.3688e-01, -9.2068e-01,
         -9.7651e-02],
        [ 5.1418e-01, -7.4852e-01, -5.3565e-01,  9.5805e-01, -8.5945e-01,
         -2.0952e-01],
        [-9.7837e-01, -9.8537e-01, -9.6886e-01,  5.8167e-01,  9.7930e-01,
         -9.7391e-03],
        [-9.6264e-01, -9.7904e-01, -9.3872e-01, -1.4212e-01,  9.5814e-01,
          8.6651e-01],
        [ 8.9909e-01,  9.3885e-01, -9.5797e-01, -4.8509e-01, -3.5657e-01,
          7.9705e-02],
        [ 8.5745e-01, -2.6562e-01,  9.9003e-01,  6.3126e-01, -7.4791e-01,
         -9.4713e-01],
        [ 9.7976e-01,  5.4841e-01,  9.6575e-01,  1.7261e-02, -8.1853e-01,
         -5.2470e-01],
        [ 8.8781e-01,  2.3970e-01, -6.0278e-01,  6.4786e-01, -9.6404e-01,
         -2.8074e-01],
        [-9.9313e-01, -9.7670e-01, -9.9111e-01,  7.4118e-01,  9.3335e-01,
          8.4485e-01],
        [-9.7100e-01, -9.9367e-01, -9.0848e-01, -6.9266e-01,  8.1596e-01,
          6.7734e-01],
        [ 7.2388e-01,  6.3909e-01, -8.6739e-01, -3.4132e-01,  9.5072e-01,
          1.4086e-01],
        [ 9.6381e-01, -8.7568e-01,  9.8917e-01,  6.2418e-04, -9.0438e-01,
          1.2874e-01]], device='cuda:0')
squash tensor([[ 2.8207e+00,  4.4909e-01,  2.5175e+00, -5.2299e-02, -1.7887e+00,
         -4.3750e-01],
        [ 2.2181e+00, -7.8644e-03,  2.2956e+00,  4.6335e-01, -1.3156e+00,
         -3.3079e-01],
        [ 2.3003e+00,  3.6418e-01,  1.5422e+00,  6.3533e-01, -1.9024e+00,
         -2.1904e+00],
        [ 1.2013e+00, -9.1173e-02, -1.5556e+00,  6.7116e-01, -2.2641e+00,
         -8.8909e-01],
        [-2.1844e+00, -2.0702e+00, -1.4967e+00,  6.0181e-01,  1.4702e+00,
          3.4765e-02],
        [-1.4082e+00, -2.9017e+00, -2.6589e+00, -1.0308e+00,  1.8057e+00,
          6.8508e-01],
        [ 1.3232e+00,  1.2772e+00, -8.7405e-01, -4.5628e-01,  1.1725e+00,
         -4.2635e-03],
        [ 2.1197e+00, -3.7132e-01,  2.3815e+00,  6.3790e-01, -1.3962e+00,
          9.3229e-02],
        [ 2.0445e+00,  1.5333e-01,  2.1124e+00,  7.5290e-01, -1.5935e+00,
         -9.7963e-02],
        [ 5.6840e-01, -9.6957e-01, -5.9804e-01,  1.9216e+00, -1.2912e+00,
         -2.1267e-01],
        [-2.2579e+00, -2.4553e+00, -2.0734e+00,  6.6498e-01,  2.2802e+00,
         -9.7394e-03],
        [-1.9807e+00, -2.2739e+00, -1.7272e+00, -1.4309e-01,  1.9228e+00,
          1.3189e+00],
        [ 1.4675e+00,  1.7283e+00, -1.9207e+00, -5.2962e-01, -3.7295e-01,
          7.9874e-02],
        [ 1.2836e+00, -2.7215e-01,  2.6484e+00,  7.4351e-01, -9.6819e-01,
         -1.8031e+00],
        [ 2.2916e+00,  6.1610e-01,  2.0250e+00,  1.7262e-02, -1.1524e+00,
         -5.8280e-01],
        [ 1.4115e+00,  2.4446e-01, -6.9750e-01,  7.7161e-01, -2.0002e+00,
         -2.8849e-01],
        [-2.8349e+00, -2.2204e+00, -2.7058e+00,  9.5309e-01,  1.6838e+00,
          1.2379e+00],
        [-2.1094e+00, -2.8764e+00, -1.5188e+00, -8.5304e-01,  1.1446e+00,
          8.2419e-01],
        [ 9.1575e-01,  7.5663e-01, -1.3224e+00, -3.5559e-01,  1.8392e+00,
          1.4180e-01],
        [ 1.9969e+00, -1.3569e+00,  2.6066e+00,  6.2418e-04, -1.4958e+00,
          1.2945e-01]], device='cuda:0')
action: tensor([[ 0.9036,  0.6411, -0.8878,  0.8479,  0.7318,  0.1438],
        [ 0.9623,  0.3018,  0.9131, -0.4900, -0.5211, -0.0090],
        [ 0.9771, -0.8424,  0.9872, -0.0639, -0.9000, -0.4899],
        [ 0.9969,  0.5632,  0.9965,  0.7995, -0.9529, -0.5598],
        [ 0.9382, -0.0290, -0.7632,  0.0274, -0.9204, -0.9526],
        [-0.9889, -0.8983, -0.9041,  0.5028,  0.9457, -0.6775],
        [-0.9455, -0.9845, -0.9497, -0.4362,  0.9750,  0.8334],
        [-0.2915,  0.9164, -0.8657, -0.7851, -0.1537, -0.8740],
        [ 0.9919,  0.3417,  0.9907,  0.5730, -0.9354, -0.6151],
        [ 0.9936,  0.6883,  0.9578, -0.1030, -0.9859, -0.9031],
        [ 0.9718, -0.6032, -0.9858,  0.9720, -0.8330, -0.8282],
        [-0.9983, -0.9646, -0.9854,  0.8296,  0.9626,  0.9583],
        [-0.9752, -0.9947, -0.9775, -0.7827,  0.8955,  0.6212],
        [ 0.3339,  0.3750, -0.9284, -0.7199,  0.1850,  0.8950],
        [ 0.9593, -0.2041,  0.9008,  0.3140, -0.5188,  0.2236],
        [ 0.6260,  0.6089,  0.9306,  0.7303, -0.8348,  0.2533],
        [ 0.9570, -0.5010, -0.0695,  0.8232, -0.8848, -0.8661],
        [-0.8965, -0.8723, -0.9894,  0.5285,  0.9746, -0.7283],
        [-0.8312, -0.9425, -0.9129, -0.9531,  0.7798, -0.5341],
        [-0.5176,  0.9908, -0.9608, -0.9782,  0.5480,  0.8018]],
       device='cuda:0')
squash tensor([[ 1.4914,  0.7600, -1.4115,  1.2487,  0.9326,  0.1448],
        [ 1.9761,  0.3115,  1.5459, -0.5360, -0.5779, -0.0090],
        [ 2.2286, -1.2293,  2.5237, -0.0640, -1.4723, -0.5359],
        [ 3.2343,  0.6375,  3.1729,  1.0972, -1.8625, -0.6325],
        [ 1.7232, -0.0291, -1.0039,  0.0274, -1.5917, -1.8595],
        [-2.5941, -1.4633, -1.4942,  0.5530,  1.7899, -0.8244],
        [-1.7871, -2.4257, -1.8284, -0.4675,  2.1846,  1.1991],
        [-0.3002,  1.5660, -1.3156, -1.0585, -0.1549, -1.3496],
        [ 2.7508,  0.3560,  2.6814,  0.6520, -1.7002, -0.7171],
        [ 2.8716,  0.8447,  1.9187, -0.1034, -2.4736, -1.4888],
        [ 2.1237, -0.6981, -2.4709,  2.1276, -1.1977, -1.1823],
        [-3.5462, -2.0075, -2.4572,  1.1870,  1.9797,  1.9246],
        [-2.1894, -2.9625, -2.2389, -1.0524,  1.4488,  0.7270],
        [ 0.3472,  0.3942, -1.6469, -0.9075,  0.1871,  1.4463],
        [ 1.9367, -0.2070,  1.4765,  0.3250, -0.5746,  0.2274],
        [ 0.7349,  0.7072,  1.6626,  0.9293, -1.2039,  0.2589],
        [ 1.9090, -0.5507, -0.0696,  1.1668, -1.3973, -1.3174],
        [-1.4539, -1.3426, -2.6172,  0.5881,  2.1760, -0.9250],
        [-1.1919, -1.7604, -1.5448, -1.8645,  1.0449, -0.5958],
        [-0.5730,  2.6877, -1.9567, -2.2537,  0.6155,  1.1036]],
       device='cuda:0')
action: tensor([[-0.9405, -0.9639, -0.9806,  0.3380,  0.9580,  0.1162],
        [-0.9782, -0.9878, -0.9959, -0.6353,  0.9943,  0.7536],
        [ 0.9479,  0.5274, -0.6825, -0.3523,  0.9529,  0.8189],
        [ 0.9722, -0.3321,  0.9899,  0.3826, -0.7441, -0.3454],
        [ 0.9684,  0.2152,  0.9315, -0.4321, -0.8891, -0.4573],
        [ 0.9551,  0.6447,  0.8133,  0.4448, -0.9675, -0.7406],
        [ 0.9366,  0.4935, -0.4748, -0.0301, -0.9870, -0.8737],
        [-0.9792, -0.9586, -0.8753,  0.5413,  0.8291, -0.1349],
        [-0.9752, -0.9404, -0.9724, -0.6889,  0.9761,  0.8233],
        [ 0.7676,  0.3817, -0.2216,  0.1404,  0.8319, -0.0328],
        [ 0.9979,  0.3858,  0.9521,  0.6640, -0.8042, -0.5059],
        [ 0.9858,  0.6435,  0.9929,  0.6327, -0.9714, -0.7987],
        [ 0.9749,  0.0287, -0.7603,  0.9568, -0.8141,  0.7289],
        [-0.9880, -0.9725, -0.9273,  0.9175,  0.9914,  0.9862],
        [-0.9393, -0.9762, -0.9917, -0.1325,  0.9429,  0.8815],
        [ 0.9912, -0.1983, -0.8641,  0.1938,  0.9238, -0.0651],
        [ 0.9723, -0.1209,  0.8626,  0.4716, -0.8238,  0.9378],
        [-0.9311,  0.2396, -0.9413,  0.6642, -0.1872,  0.8216],
        [ 0.7212,  0.9573, -0.9832, -0.9536,  0.3297, -0.0600],
        [ 0.9979, -0.5199,  0.9870, -0.8616, -0.8593, -0.8889]],
       device='cuda:0')
squash tensor([[-1.7420, -1.9979, -2.3129,  0.3518,  1.9209,  0.1167],
        [-2.2545, -2.5469, -3.0949, -0.7503,  2.9249,  0.9813],
        [ 1.8106,  0.5865, -0.8338, -0.3681,  1.8629,  1.1535],
        [ 2.1312, -0.3452,  2.6408,  0.4031, -0.9596, -0.3602],
        [ 2.0663,  0.2186,  1.6696, -0.4625, -1.4178, -0.4938],
        [ 1.8873,  0.7662,  1.1366,  0.4782, -2.0517, -0.9518],
        [ 1.7100,  0.5407, -0.5163, -0.0301, -2.5134, -1.3487],
        [-2.2770, -1.9289, -1.3553,  0.6060,  1.1853, -0.1357],
        [-2.1882, -1.7415, -2.1353, -0.8459,  2.2083,  1.1670],
        [ 1.0144,  0.4020, -0.2254,  0.1413,  1.1943, -0.0328],
        [ 3.4233,  0.4068,  1.8536,  0.7999, -1.1104, -0.5572],
        [ 2.4700,  0.7641,  2.8197,  0.7459, -2.1168, -1.0951],
        [ 2.1824,  0.0287, -0.9969,  1.9065, -1.1389,  0.9264],
        [-2.5539, -2.1361, -1.6389,  1.5732,  2.7249,  2.4857],
        [-1.7318, -2.2105, -2.7410, -0.1333,  1.7631,  1.3824],
        [ 2.7124, -0.2010, -1.3095,  0.1963,  1.6146, -0.0652],
        [ 2.1319, -0.1215,  1.3033,  0.5122, -1.1685,  1.7191],
        [-1.6663,  0.2443, -1.7490,  0.8003, -0.1894,  1.1616],
        [ 0.9101,  1.9128, -2.3856, -1.8695,  0.3425, -0.0601],
        [ 3.4375, -0.5762,  2.5155, -1.2993, -1.2906, -1.4166]],
       device='cuda:0')
action: tensor([[ 0.9761, -0.6128, -0.9251,  0.9219, -0.8202, -0.5954],
        [-0.9616, -0.8579, -0.9631,  0.9026,  0.9768,  0.8457],
        [-0.9689, -0.9941, -0.9647, -0.7356,  0.9827,  0.7196],
        [ 0.3017,  0.7366, -0.9934, -0.6069,  0.7108,  0.6445],
        [ 0.9918,  0.0709,  0.9833,  0.4902, -0.6901,  0.4067],
        [ 0.9523,  0.1242,  0.9266,  0.2396, -0.8179, -0.7259],
        [ 0.9674, -0.7460, -0.1795,  0.8488, -0.9043, -0.9522],
        [-0.9817, -0.7945, -0.9723,  0.5289,  0.9731, -0.6295],
        [-0.9538, -0.9812, -0.9260, -0.5869,  0.9382, -0.0512],
        [ 0.3147,  0.7743, -0.9684, -0.8840,  0.4527,  0.7463],
        [ 0.9955, -0.5661,  0.9900,  0.2808, -0.9524, -0.9767],
        [ 0.9840,  0.6040,  0.9785, -0.4668, -0.9907,  0.0134],
        [ 0.9803, -0.0592, -0.8854,  0.8862, -0.8748,  0.3336],
        [-0.9931, -0.4565, -0.7755,  0.6055,  0.9831,  0.8900],
        [-0.9806, -0.9886, -0.9541, -0.4857,  0.9930,  0.9474],
        [ 0.9005,  0.2700, -0.8246, -0.1215,  0.3785, -0.2994],
        [ 0.9778, -0.3967,  0.9978,  0.3761, -0.8994, -0.1024],
        [ 0.9679, -0.3687,  0.9696, -0.1203, -0.7471, -0.8230],
        [ 0.9975,  0.8127,  0.9994,  0.4736, -0.9772, -0.6923],
        [ 0.9612,  0.4128, -0.9265,  0.2402, -0.9898, -0.9645]],
       device='cuda:0')
squash tensor([[ 2.2066, -0.7134, -1.6236,  1.6015, -1.1576, -0.6859],
        [-1.9670, -1.2853, -1.9874,  1.4861,  2.2222,  1.2407],
        [-2.0748, -2.9156, -2.0100, -0.9408,  2.3717,  0.9069],
        [ 0.3114,  0.9431, -2.8520, -0.7040,  0.8888,  0.7658],
        [ 2.7487,  0.0710,  2.3896,  0.5364, -0.8481,  0.4317],
        [ 1.8564,  0.1248,  1.6335,  0.2444, -1.1505, -0.9200],
        [ 2.0503, -0.9638, -0.1814,  1.2518, -1.4955, -1.8545],
        [-2.3432, -1.0834, -2.1328,  0.5887,  2.1485, -0.7406],
        [-1.8727, -2.3285, -1.6298, -0.6730,  1.7225, -0.0512],
        [ 0.3257,  1.0309, -2.0651, -1.3937,  0.4881,  0.9646],
        [ 3.0419, -0.6418,  2.6477,  0.2885, -1.8573, -2.2205],
        [ 2.4098,  0.6995,  2.2609, -0.5060, -2.6853,  0.0134],
        [ 2.3048, -0.0592, -1.4002,  1.4042, -1.3533,  0.3469],
        [-2.8333, -0.4929, -1.0340,  0.7018,  2.3833,  1.4218],
        [-2.3136, -2.5800, -1.8758, -0.5304,  2.8227,  1.8061],
        [ 1.4749,  0.2768, -1.1710, -0.1221,  0.3983, -0.3089],
        [ 2.2451, -0.4197,  3.4116,  0.3955, -1.4690, -0.1027],
        [ 2.0575, -0.3869,  2.0852, -0.1208, -0.9664, -1.1662],
        [ 3.3473,  1.1351,  4.0384,  0.5147, -2.2321, -0.8523],
        [ 1.9620,  0.4390, -1.6334,  0.2450, -2.6382, -2.0064]],
       device='cuda:0')
action: tensor([[-0.9419, -0.9778, -0.9628, -0.6016,  0.7676,  0.4097],
        [ 0.9889,  0.6898, -0.9875, -0.6267,  0.5981, -0.0661],
        [ 0.9712, -0.4004,  0.9784,  0.0520, -0.7557,  0.0634],
        [ 0.9822,  0.2782,  0.7525,  0.0324, -0.3656, -0.4118],
        [ 0.9631,  0.5866,  0.9792,  0.2693, -0.8514, -0.8078],
        [ 0.8421, -0.1382, -0.9821,  0.0050, -0.9908, -0.9806],
        [-0.9932, -0.9770, -0.9486,  0.5368,  0.8317, -0.7388],
        [-0.9664, -0.9994, -0.9544, -0.7615,  0.9918,  0.9086],
        [ 0.6560,  0.6646, -0.8109, -0.7742,  0.0719, -0.0913],
        [ 0.8733, -0.0396,  0.9942,  0.6264, -0.9387, -0.2897],
        [ 0.9588, -0.2448,  0.9170,  0.4544, -0.9212, -0.6181],
        [ 0.9710,  0.2947, -0.4190,  0.9525, -0.8661, -0.1458],
        [-0.9926, -0.6972, -0.9347,  0.6372,  0.8231,  0.4544],
        [-0.8725, -0.9701, -0.9833, -0.0643,  0.7697,  0.8840],
        [ 0.7928,  0.4553, -0.9440, -0.3044, -0.2962, -0.0972],
        [ 0.9907,  0.3847,  0.9876,  0.3754, -0.7356, -0.4348],
        [ 0.9962,  0.2143,  0.9861, -0.0416, -0.8661,  0.4474],
        [ 0.9840,  0.2948,  0.2757,  0.3656, -0.9696, -0.8719],
        [ 0.9859, -0.1596, -0.8940,  0.4917, -0.9700, -0.9195],
        [-0.9958, -0.9143, -0.3091,  0.1299,  0.8983,  0.5450]],
       device='cuda:0')
squash tensor([[-1.7545, -2.2439, -1.9826, -0.6957,  1.0145,  0.4353],
        [ 2.5940,  0.8476, -2.5328, -0.7359,  0.6902, -0.0662],
        [ 2.1134, -0.4241,  2.2580,  0.0520, -0.9861,  0.0635],
        [ 2.3555,  0.2857,  0.9788,  0.0324, -0.3834, -0.4378],
        [ 1.9864,  0.6724,  2.2774,  0.2761, -1.2613, -1.1208],
        [ 1.2284, -0.1391, -2.3528,  0.0050, -2.6906, -2.3133],
        [-2.8437, -2.2259, -1.8179,  0.5996,  1.1935, -0.9478],
        [-2.0345, -4.0796, -1.8793, -0.9998,  2.7461,  1.5192],
        [ 0.7858,  0.8009, -1.1296, -1.0308,  0.0721, -0.0915],
        [ 1.3466, -0.0397,  2.9214,  0.7355, -1.7273, -0.2982],
        [ 1.9310, -0.2499,  1.5698,  0.4903, -1.5972, -0.7219],
        [ 2.1097,  0.3037, -0.4465,  1.8582, -1.3173, -0.1468],
        [-2.7989, -0.8618, -1.6941,  0.7534,  1.1665,  0.4902],
        [-1.3435, -2.0932, -2.3876, -0.0644,  1.0196,  1.3939],
        [ 1.0790,  0.4914, -1.7733, -0.3144, -0.3053, -0.0976],
        [ 2.6808,  0.4056,  2.5399,  0.3947, -0.9408, -0.4658],
        [ 3.1306,  0.2177,  2.4816, -0.0416, -1.3173,  0.4815],
        [ 2.4107,  0.3038,  0.2830,  0.3833, -2.0849, -1.3412],
        [ 2.4749, -0.1610, -1.4416,  0.5383, -2.0922, -1.5855],
        [-3.0834, -1.5531, -0.3196,  0.1306,  1.4632,  0.6113]],
       device='cuda:0')
action: tensor([[-0.9944, -0.9904, -0.9525,  0.0048,  0.9405,  0.9313],
        [-0.9859, -0.9812, -0.9707, -0.9100,  0.9522,  0.5122],
        [ 0.9751, -0.4413,  0.9950,  0.6582,  0.7866,  0.8701],
        [ 0.9566, -0.0623,  0.9895,  0.2044, -0.6792, -0.3811],
        [ 0.9987, -0.2349,  0.9792,  0.7812, -0.9305, -0.9213],
        [ 0.9251, -0.6628, -0.7236,  0.9519, -0.9794, -0.6567],
        [-0.9946, -0.9849, -0.9647,  0.9923,  0.9863,  0.9455],
        [-0.8236, -0.8757, -0.9713, -0.2044,  0.9767,  0.9482],
        [-0.0860,  0.6724, -0.9637, -0.2844,  0.1516, -0.2972],
        [ 0.9928,  0.9147,  0.9846,  0.4450, -0.9768, -0.5925],
        [ 0.9986,  0.7620,  0.9865,  0.5979, -0.9437, -0.4323],
        [ 0.9857,  0.2605, -0.8880,  0.7981, -0.9873, -0.2719],
        [-0.9479, -0.6418, -0.7485,  0.7527,  0.9400,  0.3376],
        [-0.9045, -0.9496, -0.9431, -0.3685,  0.9652,  0.9192],
        [ 0.4496,  0.5115, -0.8597, -0.5225,  0.7547,  0.2075],
        [ 0.9787,  0.1968,  0.9801,  0.7360, -0.2113,  0.3894],
        [ 0.0693, -0.7029,  0.6698,  0.9627, -0.6308, -0.3981],
        [ 0.8700, -0.8446, -0.0709,  0.9076, -0.9695, -0.2655],
        [-0.9906, -0.9960, -0.9685,  0.8371,  0.9847, -0.8963],
        [-0.9746, -0.9923, -0.9043, -0.9573,  0.8800, -0.4390]],
       device='cuda:0')
squash tensor([[-2.9407, -2.6666, -1.8583,  0.0048,  1.7422,  1.6681],
        [-2.4756, -2.3294, -2.1051, -1.5276,  1.8545,  0.5657],
        [ 2.1860, -0.4739,  2.9978,  0.7896,  1.0624,  1.3336],
        [ 1.9045, -0.0624,  2.6216,  0.2073, -0.8276, -0.4014],
        [ 3.6579, -0.2393,  2.2779,  1.0486, -1.6621, -1.5976],
        [ 1.6231, -0.7979, -0.9152,  1.8519, -2.2818, -0.7870],
        [-2.9595, -2.4393, -2.0100,  2.7805,  2.4876,  1.7879],
        [-1.1680, -1.3571, -2.1145, -0.2073,  2.2213,  1.8141],
        [-0.0862,  0.8152, -1.9951, -0.2924,  0.1528, -0.3065],
        [ 2.8089,  1.5557,  2.4297,  0.4785, -2.2222, -0.6815],
        [ 3.6287,  1.0010,  2.4958,  0.6899, -1.7707, -0.4627],
        [ 2.4663,  0.2666, -1.4125,  1.0935, -2.5280, -0.2790],
        [-1.8108, -0.7613, -0.9695,  0.9791,  1.7376,  0.3514],
        [-1.4967, -1.8275, -1.7656, -0.3866,  2.0170,  1.5840],
        [ 0.4841,  0.5648, -1.2923, -0.5798,  0.9837,  0.2106],
        [ 2.2655,  0.1994,  2.2994,  0.9417, -0.2145,  0.4111],
        [ 0.0694, -0.8731,  0.8104,  1.9818, -0.7428, -0.4213],
        [ 1.3332, -1.2369, -0.0710,  1.5137, -2.0846, -0.2720],
        [-2.6784, -3.1028, -2.0672,  1.2115,  2.4339, -1.4529],
        [-2.1763, -2.7771, -1.4955, -1.9121,  1.3757, -0.4710]],
       device='cuda:0')
action: tensor([[ 8.0476e-01,  1.1394e-01, -7.0482e-01,  2.6929e-01, -9.6532e-01,
         -3.0081e-01],
        [-9.6794e-01, -8.8621e-01, -9.5155e-01,  4.5569e-01,  9.6475e-01,
          8.6019e-01],
        [-9.9668e-01, -9.4522e-01, -9.8766e-01,  2.2208e-02,  9.7455e-01,
          7.5357e-01],
        [ 9.8226e-01,  4.7854e-01, -3.9940e-01, -1.4860e-01,  5.9206e-01,
         -6.3587e-01],
        [ 9.8846e-01,  6.9011e-02,  8.3829e-01,  6.7135e-01, -9.5661e-01,
          3.9042e-01],
        [ 9.6401e-01, -7.7236e-02,  9.8599e-01,  1.9935e-01, -8.7705e-01,
         -8.8086e-01],
        [ 9.9695e-01,  7.1223e-01,  9.6606e-01,  4.1323e-01, -8.6457e-01,
         -9.5665e-01],
        [ 8.4294e-01, -1.0503e-01, -9.2337e-01,  1.7453e-01, -9.3705e-01,
         -7.9348e-01],
        [-9.9441e-01, -8.5475e-01, -9.2389e-01,  2.9826e-01,  9.7871e-01,
         -1.7033e-01],
        [-9.5830e-01, -8.9301e-01, -9.7713e-01, -2.8403e-01,  8.2059e-01,
          9.7693e-01],
        [ 6.2570e-01,  6.1933e-01, -9.3485e-01, -4.7200e-01,  4.2045e-01,
          3.8105e-01],
        [ 9.8664e-01, -3.1266e-02,  6.4177e-01,  2.6789e-01, -6.1354e-01,
          8.8691e-01],
        [ 9.9346e-01,  4.3756e-04,  9.6614e-01,  4.0301e-02, -7.3551e-01,
         -8.6708e-01],
        [ 9.1940e-01, -4.2744e-01, -7.1857e-01,  8.5579e-01, -9.5484e-01,
         -7.4064e-01],
        [-9.9685e-01, -8.2925e-01, -8.5083e-01,  5.7790e-01,  9.7431e-01,
          2.7892e-01],
        [-9.1008e-01, -8.1940e-01, -9.7916e-01, -4.4992e-01,  7.0245e-01,
          2.8943e-01],
        [ 5.2996e-01,  7.7013e-01, -8.8778e-01, -8.7472e-01,  1.2997e-02,
         -3.5597e-01],
        [ 8.9780e-01, -4.9515e-02,  9.9247e-01,  5.7730e-01,  1.3084e-01,
         -7.3117e-01],
        [ 9.5218e-01,  5.2569e-01,  8.5698e-01,  1.6710e-01, -9.7033e-01,
         -3.6808e-01],
        [ 9.9540e-01, -4.7041e-01,  1.9674e-01,  7.2055e-01, -8.7184e-01,
         -6.0722e-01]], device='cuda:0')
squash tensor([[ 1.1120e+00,  1.1444e-01, -8.7681e-01,  2.7610e-01, -2.0187e+00,
         -3.1041e-01],
        [-2.0585e+00, -1.4040e+00, -1.8479e+00,  4.9186e-01,  2.0104e+00,
          1.2941e+00],
        [-3.2000e+00, -1.7849e+00, -2.5411e+00,  2.2212e-02,  2.1758e+00,
          9.8116e-01],
        [ 2.3582e+00,  5.2109e-01, -4.2293e-01, -1.4971e-01,  6.8083e-01,
         -7.5120e-01],
        [ 2.5745e+00,  6.9121e-02,  1.2154e+00,  8.1320e-01, -1.9044e+00,
          4.1230e-01],
        [ 1.9998e+00, -7.7390e-02,  2.4771e+00,  2.0206e-01, -1.3629e+00,
         -1.3796e+00],
        [ 3.2419e+00,  8.9169e-01,  2.0297e+00,  4.3950e-01, -1.3112e+00,
         -1.9049e+00],
        [ 1.2312e+00, -1.0542e-01, -1.6114e+00,  1.7633e-01, -1.7133e+00,
         -1.0807e+00],
        [-2.9389e+00, -1.2735e+00, -1.6150e+00,  3.0761e-01,  2.2660e+00,
         -1.7201e-01],
        [-1.9247e+00, -1.4366e+00, -2.2299e+00, -2.9206e-01,  1.1586e+00,
          2.2253e+00],
        [ 7.3432e-01,  7.2391e-01, -1.6955e+00, -5.1265e-01,  4.4823e-01,
          4.0129e-01],
        [ 2.5008e+00, -3.1276e-02,  7.6118e-01,  2.7459e-01, -7.1458e-01,
          1.4072e+00],
        [ 2.8597e+00,  4.3756e-04,  2.0308e+00,  4.0322e-02, -9.4064e-01,
         -1.3212e+00],
        [ 1.5851e+00, -4.5676e-01, -9.0469e-01,  1.2774e+00, -1.8839e+00,
         -9.5189e-01],
        [-3.2261e+00, -1.1857e+00, -1.2592e+00,  6.5930e-01,  2.1709e+00,
          2.8651e-01],
        [-1.5280e+00, -1.1550e+00, -2.2768e+00, -4.8461e-01,  8.7212e-01,
          2.9794e-01],
        [ 5.9009e-01,  1.0207e+00, -1.4113e+00, -1.3528e+00,  1.2997e-02,
         -3.7227e-01],
        [ 1.4608e+00, -4.9555e-02,  2.7889e+00,  6.5841e-01,  1.3160e-01,
         -9.3123e-01],
        [ 1.8546e+00,  5.8416e-01,  1.2819e+00,  1.6869e-01, -2.0978e+00,
         -3.8620e-01],
        [ 3.0362e+00, -5.1060e-01,  1.9934e-01,  9.0879e-01, -1.3407e+00,
         -7.0450e-01]], device='cuda:0')
action: tensor([[ 0.9867, -0.1285,  0.8762,  0.5478, -0.2999, -0.6490],
        [ 0.7745, -0.2217,  0.2888,  0.0816, -0.8429, -0.9788],
        [-0.8730, -0.9880, -0.9774,  0.1526,  0.1495, -0.9414],
        [-0.9868, -0.7769, -0.9432, -0.4321,  0.9499, -0.1528],
        [-0.2173,  0.1244, -0.8033, -0.9738,  0.5591,  0.4237],
        [ 0.9140,  0.9078,  0.5943, -0.8399, -0.8401, -0.6681],
        [ 0.9658,  0.3925,  0.9979, -0.5275, -0.9479, -0.6776],
        [ 0.9785,  0.2196,  0.7604,  0.3822, -0.7916, -0.4801],
        [ 0.9370,  0.5061, -0.9647,  0.3940, -0.9444, -0.8723],
        [-0.9983, -0.9890, -0.9294,  0.4588,  0.9632,  0.5543],
        [-0.9939, -0.8968, -0.9427, -0.7882,  0.9479,  0.8718],
        [ 0.8541,  0.2275, -0.8068,  0.5593,  0.9844,  0.7509],
        [ 0.9838, -0.5041,  0.9857, -0.1227, -0.8632, -0.5607],
        [ 0.9663, -0.4136,  0.9397,  0.0172, -0.9239, -0.7653],
        [ 0.9956,  0.0530,  0.9827,  0.7218, -0.9828, -0.9369],
        [ 0.8688,  0.2205, -0.8670,  0.5686, -0.9750, -0.9343],
        [-0.9906, -0.9872, -0.9815,  0.3235,  0.9705,  0.6633],
        [-0.9025, -0.9880, -0.9796, -0.5212,  0.8092,  0.8482],
        [ 0.8455,  0.5621, -0.7652,  0.4230,  0.8211,  0.4651],
        [ 0.9086,  0.0088,  0.9944,  0.4441, -0.8083, -0.7509]],
       device='cuda:0')
squash tensor([[ 2.5014, -0.1292,  1.3592,  0.6152, -0.3094, -0.7736],
        [ 1.0314, -0.2255,  0.2972,  0.0818, -1.2312, -2.2684],
        [-1.3456, -2.5558, -2.2368,  0.1538,  0.1506, -1.7503],
        [-2.5083, -1.0375, -1.7665, -0.4625,  1.8312, -0.1540],
        [-0.2208,  0.1250, -1.1078, -2.1608,  0.6315,  0.4522],
        [ 1.5510,  1.5151,  0.6842, -1.2209, -1.2215, -0.8073],
        [ 2.0252,  0.4148,  3.4348, -0.5866, -1.8110, -0.8247],
        [ 2.2610,  0.2232,  0.9973,  0.4027, -1.0758, -0.5231],
        [ 1.7129,  0.5575, -2.0099,  0.4165, -1.7772, -1.3424],
        [-3.5257, -2.5999, -1.6538,  0.4958,  1.9882,  0.6245],
        [-2.8935, -1.4558, -1.7617, -1.0666,  1.8102,  1.3407],
        [ 1.2710,  0.2315, -1.1179,  0.6318,  2.4238,  0.9750],
        [ 2.4031, -0.5547,  2.4663, -0.1233, -1.3059, -0.6339],
        [ 2.0334, -0.4399,  1.7356,  0.0172, -1.6151, -1.0089],
        [ 3.0635,  0.0530,  2.3702,  0.9114, -2.3747, -1.7123],
        [ 1.3281,  0.2242, -1.3208,  0.6454, -2.1841, -1.6914],
        [-2.6772, -2.5236, -2.3365,  0.3356,  2.1002,  0.7986],
        [-1.4857, -2.5548, -2.2884, -0.5780,  1.1248,  1.2498],
        [ 1.2401,  0.6359, -1.0086,  0.4514,  1.1603,  0.5037],
        [ 1.5197,  0.0088,  2.9370,  0.4773, -1.1221, -0.9749]],
       device='cuda:0')
action: tensor([[-0.9937, -0.9620, -0.9283,  0.2314,  0.9924,  0.8151],
        [ 0.4528,  0.0294, -0.8868, -0.8888,  0.4682,  0.5413],
        [ 0.9867,  0.4273,  0.9703,  0.6700, -0.1881,  0.9629],
        [ 0.8309, -0.7009,  0.7263,  0.5815, -0.0139,  0.1263],
        [-0.9905,  0.9770, -0.6951, -0.8931, -0.2411, -0.7283],
        [ 0.9997,  0.9961, -0.8179, -0.8925, -0.7669,  0.4514],
        [ 0.9997, -0.0113,  0.9851, -0.8463, -0.9924, -0.9105],
        [ 0.9424,  0.7513,  0.4428, -0.1790, -0.8456, -0.8101],
        [ 0.0573, -0.0772, -0.9235,  0.3214, -0.5145, -0.5713],
        [-0.9494, -0.9944, -0.8807,  0.2521,  0.9751,  0.6333],
        [-0.9783, -0.9882, -0.9719, -0.8062,  0.9298,  0.9310],
        [ 0.9399,  0.5772,  0.6460,  0.4579,  0.2058, -0.6548],
        [ 0.9897, -0.0966,  0.9553,  0.1445, -0.9213, -0.8883],
        [ 0.9764,  0.4929,  0.9756,  0.7387, -0.8792, -0.4987],
        [ 0.9228, -0.0930, -0.4164,  0.8862, -0.9707, -0.9250],
        [-0.9858, -0.9781, -0.8130,  0.6890,  0.9889,  0.8895],
        [-0.9927, -0.9509, -0.8326, -0.2607,  0.8738,  0.8342],
        [ 0.8424,  0.1456, -0.8512,  0.0181,  0.6764,  0.0339],
        [ 0.9914,  0.1942,  0.9966,  0.7885, -0.9473, -0.6774],
        [ 0.9842,  0.1964,  0.8915,  0.9639, -0.9205, -0.6702]],
       device='cuda:0')
squash tensor([[-2.8807, -1.9717, -1.6460,  0.2357,  2.7825,  1.1419],
        [ 0.4882,  0.0294, -1.4069, -1.4162,  0.5077,  0.6061],
        [ 2.5016,  0.4566,  2.0977,  0.8107, -0.1903,  1.9838],
        [ 1.1911, -0.8690,  0.9208,  0.6648, -0.0139,  0.1269],
        [-2.6706,  2.2278, -0.8578, -1.4370, -0.2459, -0.9252],
        [ 4.4555,  3.1130, -1.1503, -1.4340, -1.0128,  0.4864],
        [ 4.4783, -0.0113,  2.4464, -1.2430, -2.7859, -1.5304],
        [ 1.7594,  0.9759,  0.4757, -0.1810, -1.2404, -1.1272],
        [ 0.0574, -0.0773, -1.6126,  0.3332, -0.5688, -0.6495],
        [-1.8256, -2.9374, -1.3787,  0.2577,  2.1860,  0.7468],
        [-2.2575, -2.5616, -2.1263, -1.1161,  1.6570,  1.6662],
        [ 1.7371,  0.6582,  0.7685,  0.4947,  0.2087, -0.7837],
        [ 2.6302, -0.0969,  1.8888,  0.1455, -1.5977, -1.4138],
        [ 2.2132,  0.5399,  2.1978,  0.9476, -1.3720, -0.5475],
        [ 1.6076, -0.0933, -0.4433,  1.4038, -2.1044, -1.6223],
        [-2.4690, -2.2514, -1.1358,  0.8461,  2.5952,  1.4195],
        [-2.8016, -1.8415, -1.1965, -0.2669,  1.3488,  1.2016],
        [ 1.2293,  0.1467, -1.2607,  0.0181,  0.8224,  0.0339],
        [ 2.7200,  0.1967,  3.1823,  1.0676, -1.8053, -0.8244],
        [ 2.4174,  0.1990,  1.4293,  1.9979, -1.5923, -0.8111]],
       device='cuda:0')
action: tensor([[-0.9789, -0.9973, -0.9873, -0.8440,  0.9869,  0.9351],
        [ 0.9163,  0.0050, -0.1881, -0.1028,  0.8938,  0.6014],
        [ 0.9916, -0.5202,  0.9947,  0.4288, -0.9120, -0.7040],
        [ 0.9887,  0.1774,  0.8697, -0.2402, -0.9759, -0.9853],
        [ 0.9841,  0.6274,  0.7407,  0.3476, -0.9955, -0.8588],
        [ 0.9521,  0.3161, -0.9610,  0.4575, -0.9776, -0.8272],
        [-0.9783, -0.9678, -0.9942,  0.4185,  0.9877,  0.9104],
        [-0.9940, -0.9418, -0.9959,  0.1387,  0.8848,  0.5947],
        [ 0.9536, -0.1955, -0.3864,  0.4614,  0.8132,  0.7633],
        [ 0.9968,  0.5992,  0.9788,  0.3571, -0.4385, -0.1013],
        [ 0.9861, -0.9231,  0.9831,  0.9406, -0.9114, -0.6911],
        [ 0.8446, -0.7829,  0.4481,  0.8993, -0.8217, -0.9626],
        [-0.8163, -0.9827, -0.4333,  0.8499,  0.9756, -0.2904],
        [-0.9209, -0.9661, -0.4427, -0.8738,  0.8866, -0.0258],
        [ 0.7714,  0.3896, -0.7575, -0.2902,  0.9344,  0.0497],
        [ 0.9875,  0.1868,  0.9853, -0.1127, -0.9114, -0.6440],
        [ 0.7910, -0.3947,  0.8349,  0.8386, -0.9183, -0.6485],
        [ 0.2985, -0.9566, -0.9183,  0.9439, -0.7608, -0.8274],
        [-0.9656, -0.9833, -0.9799,  0.9901,  0.9686,  0.6895],
        [-0.8133, -0.9920, -0.9647, -0.8699,  0.9561,  0.6918]],
       device='cuda:0')
squash tensor([[-2.2697, -3.2989, -2.5255, -1.2348,  2.5110,  1.6972],
        [ 1.5657,  0.0050, -0.1904, -0.1031,  1.4407,  0.6954],
        [ 2.7316, -0.5766,  2.9672,  0.4584, -1.5392, -0.8752],
        [ 2.5830,  0.1793,  1.3320, -0.2450, -2.2043, -2.4518],
        [ 2.4139,  0.7371,  0.9520,  0.3627, -3.0428, -1.2888],
        [ 1.8538,  0.3273, -1.9592,  0.4941, -2.2409, -1.1792],
        [-2.2562, -2.0562, -2.9219,  0.4459,  2.5415,  1.5300],
        [-2.9010, -1.7539, -3.0937,  0.1396,  1.3976,  0.6849],
        [ 1.8703, -0.1981, -0.4076,  0.4990,  1.1365,  1.0042],
        [ 3.2194,  0.6919,  2.2686,  0.3736, -0.4704, -0.1017],
        [ 2.4820, -1.6094,  2.3813,  1.7433, -1.5359, -0.8501],
        [ 1.2370, -1.0529,  0.4824,  1.4686, -1.1622, -1.9802],
        [-1.1455, -2.3700, -0.4640,  1.2559,  2.1969, -0.2990],
        [-1.5949, -2.0296, -0.4756, -1.3488,  1.4058, -0.0258],
        [ 1.0239,  0.4113, -0.9904, -0.2987,  1.6921,  0.0497],
        [ 2.5364,  0.1890,  2.4540, -0.1131, -1.5358, -0.7649],
        [ 1.0740, -0.4173,  1.2040,  1.2166, -1.5783, -0.7726],
        [ 0.3078, -1.9040, -1.5778,  1.7729, -0.9982, -1.1799],
        [-2.0234, -2.3878, -2.2954,  2.6526,  2.0692,  0.8470],
        [-1.1368, -2.7570, -2.0091, -1.3325,  1.8987,  0.8513]],
       device='cuda:0')
action: tensor([[-0.9551, -0.8578, -0.9097, -0.1162,  0.8783, -0.4720],
        [-0.1116,  0.8404, -0.8981, -0.9429,  0.1360,  0.9382],
        [ 0.9946,  0.1544,  0.9734,  0.6664, -0.8652, -0.1396],
        [-0.6393, -0.0838, -0.9251,  0.5032,  0.8678, -0.2011],
        [-0.8906,  0.2706,  0.1238, -0.1190,  0.6014,  0.4691],
        [-0.8610,  0.6125, -0.8509, -0.8646,  0.0792,  0.1911],
        [-0.8490,  0.8106, -0.9900, -0.8931, -0.8498,  0.0973],
        [ 0.0053,  0.8520, -0.9806, -0.9627,  0.4546, -0.1314],
        [ 0.9901, -0.7836,  0.9893, -0.9958, -0.9455, -0.9021],
        [ 0.8866,  0.6641, -0.9663,  0.8121, -0.9087, -0.9757],
        [-0.9955, -0.9564, -0.9828,  0.9343,  0.9768,  0.9907],
        [-0.9730, -0.8333, -0.9702, -0.9603,  0.6615,  0.9266],
        [ 0.2320,  0.7035, -0.9201, -0.0045, -0.2342,  0.3464],
        [ 0.9473, -0.2611,  0.9853, -0.1329, -0.9531, -0.8908],
        [ 0.7813,  0.4554,  0.9661, -0.2937, -0.9908, -0.6967],
        [ 0.9430,  0.1341,  0.6438,  0.6852, -0.9775,  0.2963],
        [ 0.9569, -0.0369, -0.8939,  0.3900, -0.9831, -0.8753],
        [-0.9861, -0.9977, -0.9944,  0.7227,  0.9622,  0.8796],
        [-0.9823, -0.9483, -0.9753, -0.0093,  0.8396,  0.5699],
        [ 0.8565,  0.7212, -0.9384, -0.4703,  0.1195, -0.0759]],
       device='cuda:0')
squash tensor([[-1.8865, -1.2850, -1.5257, -0.1168,  1.3684, -0.5127],
        [-0.1120,  1.2226, -1.4622, -1.7638,  0.1369,  1.7231],
        [ 2.9559,  0.1556,  2.1524,  0.8043, -1.3139, -0.1405],
        [-0.7570, -0.0840, -1.6229,  0.5535,  1.3240, -0.2039],
        [-1.4249,  0.2776,  0.1244, -0.1196,  0.6954,  0.5090],
        [-1.2972,  0.7130, -1.2594, -1.3114,  0.0794,  0.1935],
        [-1.2526,  1.1288, -2.6480, -1.4368, -1.2555,  0.0976],
        [ 0.0053,  1.2634, -2.3125, -1.9817,  0.4905, -0.1321],
        [ 2.6540, -1.0547,  2.6128, -3.0787, -1.7875, -1.4834],
        [ 1.4060,  0.8000, -2.0328,  1.1331, -1.5198, -2.1993],
        [-3.0481, -1.9017, -2.3739,  1.6911,  2.2225,  2.6834],
        [-2.1455, -1.1988, -2.0963, -1.9493,  0.7954,  1.6337],
        [ 0.2363,  0.8742, -1.5895, -0.0045, -0.2386,  0.3613],
        [ 1.8049, -0.2673,  2.4543, -0.1337, -1.8641, -1.4260],
        [ 1.0488,  0.4915,  2.0302, -0.3026, -2.6881, -0.8609],
        [ 1.7642,  0.1349,  0.7646,  0.8388, -2.2376,  0.3055],
        [ 1.9077, -0.0370, -1.4410,  0.4117, -2.3828, -1.3555],
        [-2.4795, -3.3765, -2.9409,  0.9132,  1.9749,  1.3740],
        [-2.3590, -1.8149, -2.1917, -0.0093,  1.2198,  0.6474],
        [ 1.2799,  0.9102, -1.7242, -0.5104,  0.1201, -0.0760]],
       device='cuda:0')
action: tensor([[ 0.9746, -0.0535,  0.9914, -0.1024, -0.2184,  0.4100],
        [ 0.9463, -0.2149,  0.9295,  0.5715, -0.5220,  0.2537],
        [ 0.9609,  0.5961,  0.6184,  0.4410, -0.9492, -0.8586],
        [ 0.8763, -0.5182, -0.8624,  0.6007, -0.6731, -0.8301],
        [-0.9717, -0.9778, -0.8955,  0.5639,  0.9916, -0.5117],
        [-0.9943, -0.9888, -0.9856, -0.7452,  0.8703,  0.7414],
        [ 0.3664,  0.9064, -0.8660, -0.1553,  0.4104, -0.1218],
        [ 0.9535, -0.0826,  0.9937,  0.3817, -0.9843, -0.7999],
        [ 0.9943,  0.6149,  0.9602,  0.3740, -0.9549, -0.4992],
        [ 0.7203, -0.4474, -0.9214,  0.9587, -0.2909, -0.3932],
        [-0.9883, -0.9779, -0.9404,  0.7467,  0.9329, -0.0527],
        [-0.8889, -0.8528, -0.8655, -0.3487,  0.8811,  0.6349],
        [ 0.5453,  0.5731, -0.9558, -0.6111,  0.1353, -0.4900],
        [ 0.9723, -0.2563,  0.9925,  0.4574, -0.3591,  0.1085],
        [ 0.9889,  0.1795,  0.9625,  0.0555, -0.5296, -0.9717],
        [ 0.8147,  0.2580, -0.8398,  0.9324, -0.9761, -0.7089],
        [-0.9873, -0.9512, -0.7640,  0.6077,  0.9525,  0.5638],
        [-0.9828, -0.9906, -0.9708, -0.3220,  0.9499,  0.7073],
        [ 0.5721,  0.8574, -0.9384, -0.4551,  0.3925,  0.8805],
        [ 0.9742, -0.6454,  0.9802,  0.4926, -0.9623, -0.9802]],
       device='cuda:0')
squash tensor([[ 2.1770, -0.0535,  2.7196, -0.1027, -0.2220,  0.4357],
        [ 1.7955, -0.2183,  1.6546,  0.6497, -0.5791,  0.2594],
        [ 1.9573,  0.6872,  0.7224,  0.4735, -1.8238, -1.2881],
        [ 1.3597, -0.5738, -1.3027,  0.6942, -0.8163, -1.1885],
        [-2.1222, -2.2440, -1.4491,  0.6385,  2.7350, -0.5650],
        [-2.9281, -2.5915, -2.4639, -0.9620,  1.3341,  0.9537],
        [ 0.3843,  1.5068, -1.3169, -0.1565,  0.4360, -0.1224],
        [ 1.8693, -0.0827,  2.8747,  0.4021, -2.4184, -1.0984],
        [ 2.9305,  0.7167,  1.9481,  0.3931, -1.8841, -0.5483],
        [ 0.9082, -0.4815, -1.5983,  1.9295, -0.2995, -0.4156],
        [-2.5665, -2.2465, -1.7411,  0.9655,  1.6806, -0.0527],
        [-1.4167, -1.2662, -1.3150, -0.3640,  1.3806,  0.7495],
        [ 0.6117,  0.6522, -1.8944, -0.7107,  0.1362, -0.5361],
        [ 2.1332, -0.2622,  2.7938,  0.4940, -0.3759,  0.1090],
        [ 2.5944,  0.1814,  1.9784,  0.0556, -0.5895, -2.1219],
        [ 1.1409,  0.2639, -1.2205,  1.6764, -2.2084, -0.8850],
        [-2.5260, -1.8443, -1.0058,  0.7053,  1.8580,  0.6384],
        [-2.3724, -2.6756, -2.1059, -0.3339,  1.8310,  0.8818],
        [ 0.6506,  1.2836, -1.7248, -0.4912,  0.4148,  1.3778],
        [ 2.1686, -0.7674,  2.3018,  0.5395, -1.9760, -2.3017]],
       device='cuda:0')
action: tensor([[-0.9891, -0.9878, -0.9084, -0.7434,  0.7576,  0.9227],
        [ 0.8114,  0.6494, -0.7603,  0.1957,  0.4756,  0.0848],
        [ 0.9534, -0.7667,  0.9969,  0.6292, -0.9798, -0.2369],
        [ 0.9857,  0.6536,  0.9950,  0.4178, -0.9709, -0.6409],
        [ 0.9786,  0.0610, -0.8966,  0.8748, -0.9958, -0.0862],
        [-0.9963, -0.9768, -0.9323,  0.8663,  0.9836,  0.6690],
        [-0.9579, -0.9309, -0.9393, -0.3927,  0.9615,  0.5310],
        [ 0.6271,  0.4736, -0.8328,  0.1867,  0.9647,  0.3723],
        [ 0.9925, -0.3047,  0.9779,  0.1804, -0.9286,  0.2013],
        [ 0.9966, -0.6397,  0.9889,  0.3485, -0.8665, -0.8636],
        [ 0.9384, -0.6796, -0.1701,  0.9347, -0.9666, -0.8586],
        [-0.9958, -0.8871, -0.8170,  0.7802,  0.9414,  0.8368],
        [-0.9552, -0.9934, -0.9959, -0.5860,  0.8841,  0.5851],
        [ 0.9598,  0.2533, -0.4205,  0.3628,  0.9066,  0.4291],
        [ 0.9951,  0.4257,  0.9888,  0.7194, -0.9867, -0.8927],
        [ 0.9943,  0.1972,  0.9929,  0.6411, -0.9471, -0.6084],
        [ 0.9495, -0.6538, -0.9877,  0.9596, -0.9277,  0.1881],
        [-0.9941, -0.8728, -0.9448,  0.9911,  0.9854,  0.9490],
        [-0.9508, -0.9890, -0.9898,  0.1375,  0.9721,  0.7976],
        [ 0.6206,  0.8413, -0.9821, -0.9023, -0.4075,  0.4704]],
       device='cuda:0')
squash tensor([[-2.6017, -2.5456, -1.5183, -0.9580,  0.9905,  1.6068],
        [ 1.1312,  0.7743, -0.9970,  0.1983,  0.5173,  0.0850],
        [ 1.8677, -1.0123,  3.2384,  0.7401, -2.2937, -0.2415],
        [ 2.4665,  0.7815,  2.9949,  0.4450, -2.1079, -0.7597],
        [ 2.2627,  0.0611, -1.4545,  1.3533, -3.0788, -0.0864],
        [-3.1469, -2.2230, -1.6755,  1.3179,  2.3984,  0.8089],
        [-1.9198, -1.6653, -1.7320, -0.4150,  1.9659,  0.5916],
        [ 0.7366,  0.5147, -1.1974,  0.1890,  2.0091,  0.3911],
        [ 2.7942, -0.3147,  2.2467,  0.1824, -1.6484,  0.2041],
        [ 3.1888, -0.7576,  2.5935,  0.3637, -1.3190, -1.3073],
        [ 1.7244, -0.8283, -0.1718,  1.6941, -2.0384, -1.2880],
        [-3.0830, -1.4080, -1.1477,  1.0459,  1.7498,  1.2104],
        [-1.8882, -2.8517, -3.0929, -0.6715,  1.3944,  0.6702],
        [ 1.9429,  0.2589, -0.4483,  0.3801,  1.5082,  0.4587],
        [ 3.0016,  0.4547,  2.5894,  0.9064, -2.5043, -1.4351],
        [ 2.9317,  0.1999,  2.8174,  0.7600, -1.8030, -0.7064],
        [ 1.8266, -0.7818, -2.5441,  1.9404, -1.6414,  0.1904],
        [-2.9117, -1.3449, -1.7811,  2.7060,  2.4570,  1.8211],
        [-1.8401, -2.5998, -2.6347,  0.1383,  2.1299,  1.0920],
        [ 0.7260,  1.2257, -2.3537, -1.4845, -0.4326,  0.5105]],
       device='cuda:0')
action: tensor([[ 9.5973e-01, -2.5601e-01,  9.9498e-01,  6.4694e-01, -9.4389e-01,
         -7.5703e-01],
        [ 9.7122e-01, -4.6467e-01,  9.8531e-01,  7.8046e-01, -9.7327e-01,
         -3.2142e-01],
        [ 8.3394e-01, -7.6097e-01, -2.3549e-01,  9.2805e-01, -9.5524e-01,
         -3.2253e-01],
        [-9.9023e-01, -9.8004e-01, -9.9280e-01,  9.9171e-01,  9.9303e-01,
          8.7173e-01],
        [-9.2634e-01, -9.9036e-01, -9.4339e-01, -3.7929e-01,  9.1586e-01,
          6.6292e-01],
        [ 6.3954e-01,  8.0143e-01, -8.3260e-01, -4.6201e-01,  3.1124e-01,
          2.4432e-01],
        [ 9.8850e-01,  5.3130e-01,  8.8357e-01,  3.3652e-01, -9.2321e-01,
         -5.8776e-01],
        [ 9.8876e-01,  3.7618e-01,  9.7997e-01,  4.5578e-01, -7.0181e-01,
         -8.6791e-01],
        [ 8.1961e-01,  3.2085e-01, -1.7415e-01,  7.8320e-01, -9.4999e-01,
         -9.3258e-01],
        [-9.9278e-01, -6.7318e-01, -9.4340e-01,  3.6163e-01,  9.6383e-01,
         -1.5356e-01],
        [-9.9263e-01, -9.7213e-01, -9.0680e-01, -4.9130e-01,  9.9324e-01,
          3.7865e-01],
        [ 7.7037e-01,  6.0643e-01, -6.4861e-01, -8.4772e-01, -1.0141e-01,
          8.6888e-01],
        [ 9.7164e-01, -3.3139e-01,  9.8901e-01,  2.7757e-01, -7.7923e-01,
          2.1064e-01],
        [ 9.6706e-01,  2.6627e-01,  9.9517e-01, -1.3983e-01, -7.6567e-01,
         -7.2358e-01],
        [ 9.5338e-01,  4.7818e-01,  8.9520e-01,  4.5735e-04, -9.6903e-01,
         -8.8944e-01],
        [ 9.7578e-01,  2.4183e-01, -7.5244e-01,  4.4533e-01, -9.0243e-01,
         -9.7268e-01],
        [-9.7400e-01, -9.8123e-01, -9.1297e-01,  1.9497e-01,  9.5058e-01,
          2.8724e-01],
        [-9.7057e-01, -9.9601e-01, -9.3668e-01, -6.7975e-01,  9.6300e-01,
          9.7508e-01],
        [ 8.8729e-01,  4.0024e-01, -7.6118e-01, -9.3034e-02,  7.4118e-01,
          2.0782e-01],
        [ 9.8527e-01, -1.3524e-01,  9.7309e-01,  7.3937e-01, -9.3083e-01,
         -3.9916e-01]], device='cuda:0')
squash tensor([[ 1.9424e+00, -2.6183e-01,  2.9923e+00,  7.7002e-01, -1.7726e+00,
         -9.8922e-01],
        [ 2.1133e+00, -5.0325e-01,  2.4531e+00,  1.0466e+00, -2.1508e+00,
         -3.3323e-01],
        [ 1.2009e+00, -9.9851e-01, -2.3999e-01,  1.6442e+00, -1.8884e+00,
         -3.3446e-01],
        [-2.6581e+00, -2.2986e+00, -2.8116e+00,  2.7408e+00,  2.8278e+00,
          1.3403e+00],
        [-1.6320e+00, -2.6649e+00, -1.7680e+00, -3.9924e-01,  1.5627e+00,
          7.9800e-01],
        [ 7.5739e-01,  1.1026e+00, -1.1966e+00, -4.9986e-01,  3.2191e-01,
          2.4936e-01],
        [ 2.5765e+00,  5.9196e-01,  1.3918e+00,  3.5016e-01, -1.6104e+00,
         -6.7423e-01],
        [ 2.5878e+00,  3.9560e-01,  2.2968e+00,  4.9197e-01, -8.7085e-01,
         -1.3245e+00],
        [ 1.1556e+00,  3.3259e-01, -1.7594e-01,  1.0536e+00, -1.8316e+00,
         -1.6778e+00],
        [-2.8100e+00, -8.1653e-01, -1.7681e+00,  3.7877e-01,  1.9972e+00,
         -1.5479e-01],
        [-2.7998e+00, -2.1297e+00, -1.5092e+00, -5.3778e-01,  2.8432e+00,
          3.9849e-01],
        [ 1.0212e+00,  7.0326e-01, -7.7289e-01, -1.2480e+00, -1.0176e-01,
          1.3285e+00],
        [ 2.1208e+00, -3.4439e-01,  2.5993e+00,  2.8504e-01, -1.0434e+00,
          2.1384e-01],
        [ 2.0447e+00,  2.7285e-01,  3.0123e+00, -1.4076e-01, -1.0098e+00,
         -9.1513e-01],
        [ 1.8676e+00,  5.2062e-01,  1.4475e+00,  4.5735e-04, -2.0762e+00,
         -1.4192e+00],
        [ 2.2007e+00,  2.4672e-01, -9.7856e-01,  4.7886e-01, -1.4852e+00,
         -2.1397e+00],
        [-2.1649e+00, -2.3296e+00, -1.5451e+00,  1.9749e-01,  1.8377e+00,
          2.9556e-01],
        [-2.1020e+00, -3.1080e+00, -1.7103e+00, -8.2866e-01,  1.9857e+00,
          2.1864e+00],
        [ 1.4090e+00,  4.2393e-01, -9.9902e-01, -9.3303e-02,  9.5308e-01,
          2.1090e-01],
        [ 2.4518e+00, -1.3608e-01,  2.1475e+00,  9.4909e-01, -1.6646e+00,
         -4.2265e-01]], device='cuda:0')
action: tensor([[ 0.9687, -0.2190, -0.9279,  0.9843, -0.9821, -0.2446],
        [-0.9779, -0.9875, -0.9853,  0.9718,  0.9886,  0.9926],
        [-0.9839, -0.9886, -0.8340, -0.4793,  0.9153,  0.6465],
        [ 0.8364,  0.5786, -0.9297,  0.3112,  0.2688,  0.7786],
        [ 0.9807, -0.3742,  0.9826,  0.1186, -0.8391, -0.7751],
        [ 0.9754, -0.6035,  0.9380,  0.4569, -0.9126, -0.6918],
        [ 0.9748,  0.0182, -0.3172,  0.9131, -0.9635, -0.6384],
        [-0.9761, -0.9408, -0.8796,  0.6037,  0.9644,  0.6974],
        [-0.9026, -0.9954, -0.9555, -0.6704,  0.9822,  0.3139],
        [ 0.8671, -0.0492, -0.6195,  0.1976,  0.9429,  0.9349],
        [ 0.9865, -0.0235,  0.9942,  0.4394, -0.9621, -0.9711],
        [ 0.9630,  0.4062,  0.9903,  0.4527, -0.9945, -0.9240],
        [ 0.9886,  0.1998, -0.8926,  0.9574, -0.9851,  0.8857],
        [-0.9868, -0.9724, -0.9466,  0.9497,  0.9903,  0.9482],
        [-0.9807, -0.8310, -0.9889, -0.1090,  0.8976,  0.6086],
        [ 0.5735,  0.8237, -0.9223, -0.0798,  0.8425, -0.1173],
        [ 0.8878, -0.1889,  0.9899,  0.6359, -0.1607,  0.8654],
        [ 0.9764, -0.5879,  0.9020,  0.5071, -0.6572, -0.8619],
        [ 0.9978, -0.3966,  0.9632,  0.8301, -0.7145, -0.6896],
        [ 0.9427, -0.5053, -0.8357,  0.6078, -0.9794, -0.9731]],
       device='cuda:0')
squash tensor([[ 2.0702, -0.2226, -1.6434,  2.4182, -2.3547, -0.2496],
        [-2.2477, -2.5325, -2.4533,  2.1239,  2.5823,  2.7998],
        [-2.4056, -2.5819, -1.2010, -0.5220,  1.5590,  0.7693],
        [ 1.2091,  0.6604, -1.6562,  0.3218,  0.2756,  1.0418],
        [ 2.3152, -0.3933,  2.3684,  0.1192, -1.2180, -1.0330],
        [ 2.1928, -0.6986,  1.7215,  0.4934, -1.5432, -0.8514],
        [ 2.1801,  0.0182, -0.3285,  1.5457, -1.9921, -0.7555],
        [-2.2073, -1.7451, -1.3739,  0.6990,  2.0060,  0.8623],
        [-1.4860, -3.0416, -1.8916, -0.8114,  2.3571,  0.3248],
        [ 1.3214, -0.0492, -0.7241,  0.2002,  1.7638,  1.6958],
        [ 2.4969, -0.0235,  2.9164,  0.4715, -1.9732, -2.1115],
        [ 1.9856,  0.4311,  2.6610,  0.4881, -2.9486, -1.6158],
        [ 2.5823,  0.2025, -1.4345,  1.9139, -2.4465,  1.4015],
        [-2.5061, -2.1348, -1.7984,  1.8291,  2.6603,  1.8138],
        [-2.3157, -1.1914, -2.5958, -0.1094,  1.4596,  0.7067],
        [ 0.6527,  1.1683, -1.6041, -0.0799,  1.2298, -0.1178],
        [ 1.4114, -0.1912,  2.6404,  0.7512, -0.1621,  1.3145],
        [ 2.2146, -0.6745,  1.4828,  0.5588, -0.7878, -1.3008],
        [ 3.4077, -0.4197,  1.9879,  1.1885, -0.8962, -0.8472],
        [ 1.7621, -0.5564, -1.2067,  0.7054, -2.2819, -2.1481]],
       device='cuda:0')
action: tensor([[ 6.5127e-01,  9.4772e-01, -9.4826e-01, -7.7039e-01,  2.1877e-02,
          8.8598e-01],
        [ 9.8298e-01,  6.4249e-01,  9.8350e-01,  9.4170e-02, -3.0112e-01,
          6.7229e-01],
        [-5.9176e-01, -4.0967e-01, -5.3548e-01,  6.3800e-01,  2.2466e-01,
          6.2618e-01],
        [-9.7973e-01,  9.4008e-01, -8.5059e-01, -9.6041e-01, -9.4557e-01,
          7.3465e-01],
        [ 9.4823e-01,  9.8381e-01, -6.8986e-01, -9.1022e-01, -6.2171e-01,
         -6.4971e-01],
        [ 9.9216e-01, -8.8566e-01,  8.9040e-01, -9.4793e-01, -8.4263e-01,
         -8.3133e-01],
        [ 9.6722e-01, -6.9778e-02, -7.6154e-01,  7.0262e-01, -9.7687e-01,
         -6.1848e-01],
        [-9.7762e-01, -9.5013e-01, -9.4787e-01,  8.4172e-01,  9.2863e-01,
          9.0905e-01],
        [-9.5645e-01, -9.9560e-01, -9.9422e-01, -9.5992e-01,  9.8554e-01,
          9.8901e-01],
        [ 7.9835e-01, -1.0752e-03,  3.3834e-01,  9.3193e-01,  8.0222e-01,
         -2.4881e-01],
        [ 9.2215e-01,  7.7753e-01,  9.6732e-01,  7.8023e-01, -9.8904e-01,
         -8.6850e-01],
        [ 9.7391e-01,  6.3264e-01,  7.8881e-01,  9.5840e-01, -9.6594e-01,
         -8.8443e-01],
        [ 9.1680e-01, -1.3271e-02, -9.5981e-01,  9.4985e-01, -5.8675e-01,
         -2.6974e-01],
        [-9.9260e-01, -9.8362e-01, -9.6214e-01,  9.9207e-01,  9.7486e-01,
          6.4821e-01],
        [-9.8136e-01, -9.3483e-01, -9.3569e-01,  6.8897e-02,  5.1456e-01,
          3.9351e-01],
        [ 6.8799e-01,  6.9836e-01, -8.9797e-01, -7.0153e-01, -1.8856e-01,
         -3.4877e-01],
        [ 9.8569e-01,  4.2059e-01,  9.9827e-01,  7.1099e-01, -8.1535e-01,
          5.3071e-01],
        [-7.9460e-01,  2.9856e-02, -3.5955e-01,  4.1914e-01,  5.6774e-04,
          9.1984e-01],
        [-9.5421e-01,  9.8671e-01, -9.3183e-01, -6.5756e-01, -8.6191e-01,
          6.7542e-01],
        [ 9.6700e-01,  9.8276e-01, -9.2102e-01, -8.6019e-01, -7.5416e-01,
         -6.7782e-01]], device='cuda:0')
squash tensor([[ 7.7749e-01,  1.8089e+00, -1.8142e+00, -1.0213e+00,  2.1880e-02,
          1.4029e+00],
        [ 2.3788e+00,  7.6241e-01,  2.3945e+00,  9.4450e-02, -3.1075e-01,
          8.1491e-01],
        [-6.8037e-01, -4.3522e-01, -5.9780e-01,  7.5480e-01,  2.2856e-01,
          7.3511e-01],
        [-2.2908e+00,  1.7388e+00, -1.2583e+00, -1.9512e+00, -1.7882e+00,
          9.3875e-01],
        [ 1.8139e+00,  2.4043e+00, -8.4768e-01, -1.5288e+00, -7.2779e-01,
         -7.7479e-01],
        [ 2.7689e+00, -1.4014e+00,  1.4239e+00, -1.8109e+00, -1.2302e+00,
         -1.1924e+00],
        [ 2.0473e+00, -6.9891e-02, -9.9987e-01,  8.7245e-01, -2.2240e+00,
         -7.2254e-01],
        [-2.2408e+00, -1.8331e+00, -1.8104e+00,  1.2271e+00,  1.6483e+00,
          1.5220e+00],
        [-1.9025e+00, -3.0590e+00, -2.9218e+00, -1.9449e+00,  2.4612e+00,
          2.5992e+00],
        [ 1.0941e+00, -1.0752e-03,  3.5221e-01,  1.6729e+00,  1.1048e+00,
         -2.5414e-01],
        [ 1.6032e+00,  1.0391e+00,  2.0488e+00,  1.0460e+00, -2.6004e+00,
         -1.3269e+00],
        [ 2.1631e+00,  7.4581e-01,  1.0683e+00,  1.9259e+00, -2.0278e+00,
         -1.3957e+00],
        [ 1.5686e+00, -1.3272e-02, -1.9434e+00,  1.8302e+00, -6.7269e-01,
         -2.7659e-01],
        [-2.7981e+00, -2.3982e+00, -1.9739e+00,  2.7630e+00,  2.1818e+00,
          7.7221e-01],
        [-2.3330e+00, -1.6954e+00, -1.7022e+00,  6.9006e-02,  5.6891e-01,
          4.1594e-01],
        [ 8.4413e-01,  8.6409e-01, -1.4617e+00, -8.7032e-01, -1.9085e-01,
         -3.6405e-01],
        [ 2.4663e+00,  4.4841e-01,  3.5270e+00,  8.8919e-01, -1.1428e+00,
          5.9114e-01],
        [-1.0838e+00,  2.9864e-02, -3.7637e-01,  4.4665e-01,  5.6774e-04,
          1.5880e+00],
        [-1.8768e+00,  2.5035e+00, -1.6721e+00, -7.8851e-01, -1.3007e+00,
          8.2065e-01],
        [ 2.0439e+00,  2.3725e+00, -1.5957e+00, -1.2941e+00, -9.8254e-01,
         -8.2507e-01]], device='cuda:0')
action: tensor([[ 0.9386,  0.3528,  0.9923,  0.5088, -0.8745, -0.6362],
        [ 0.9835, -0.1092,  0.9351,  0.3141, -0.9668, -0.7636],
        [ 0.9912,  0.7333,  0.6756,  0.7155, -0.9633, -0.4204],
        [-0.9522, -0.8446, -0.8847,  0.8829,  0.9132,  0.6775],
        [-0.9931, -0.9821, -0.9311, -0.0466,  0.9104,  0.9839],
        [ 0.9796,  0.2346, -0.4134,  0.7694,  0.8290,  0.2561],
        [ 0.9883, -0.0737,  0.9611,  0.0113, -0.9710,  0.0109],
        [ 0.1579, -0.1535,  0.2335,  0.7488, -0.8196,  0.4494],
        [-0.9045,  0.5746, -0.9885, -0.9152, -0.2028,  0.4268],
        [ 0.6028,  0.6594, -0.9782, -0.9917, -0.8170, -0.9517],
        [ 0.9851, -0.5424,  0.9611, -0.9665, -0.9688, -0.9687],
        [ 0.7221, -0.3039, -0.9546,  0.8944, -0.6554, -0.6252],
        [-0.9805, -0.8134, -0.9927,  0.0923,  0.9547,  0.9320],
        [-0.6219, -0.9517, -0.9877,  0.0845,  0.6579,  0.2693],
        [ 0.6057,  0.6910, -0.8321,  0.6187,  0.8859,  0.4751],
        [ 0.8905,  0.0574,  0.9963,  0.5775, -0.9084,  0.2453],
        [ 0.9362, -0.1490,  0.9667,  0.0076, -0.9676, -0.5333],
        [ 0.9925,  0.2353,  0.7922,  0.8320, -0.9878, -0.9411],
        [ 0.8027,  0.0519, -0.5400,  0.5142, -0.8422, -0.9442],
        [-0.9687, -0.9922, -0.9605,  0.5347,  0.9544,  0.5549]],
       device='cuda:0')
squash tensor([[ 1.7263,  0.3687,  2.7757,  0.5611, -1.3519, -0.7517],
        [ 2.3940, -0.1096,  1.6972,  0.3251, -2.0407, -1.0048],
        [ 2.7096,  0.9358,  0.8210,  0.8983, -1.9895, -0.4481],
        [-1.8544, -1.2370, -1.3971,  1.3888,  1.5464,  0.8245],
        [-2.8304, -2.3536, -1.6669, -0.0466,  1.5296,  2.4082],
        [ 2.2886,  0.2391, -0.4397,  1.0190,  1.1850,  0.2619],
        [ 2.5690, -0.0739,  1.9595,  0.0113, -2.1101,  0.0109],
        [ 0.1592, -0.1547,  0.2378,  0.9703, -1.1556,  0.4839],
        [-1.4966,  0.6543, -2.5766, -1.5583, -0.2057,  0.4560],
        [ 0.6975,  0.7918, -2.2540, -2.7389, -1.1478, -1.8499],
        [ 2.4446, -0.6076,  1.9596, -2.0365, -2.0718, -2.0700],
        [ 0.9120, -0.3138, -1.8808,  1.4435, -0.7848, -0.7335],
        [-2.3100, -1.1371, -2.8045,  0.0925,  1.8818,  1.6732],
        [-0.7281, -1.8493, -2.5425,  0.0847,  0.7891,  0.2761],
        [ 0.7022,  0.8498, -1.1950,  0.7228,  1.4027,  0.5166],
        [ 1.4243,  0.0575,  3.1481,  0.6587, -1.5185,  0.2504],
        [ 1.7060, -0.1501,  2.0389,  0.0076, -2.0529, -0.5947],
        [ 2.7892,  0.2398,  1.0774,  1.1944, -2.5485, -1.7476],
        [ 1.1061,  0.0520, -0.6042,  0.5684, -1.2288, -1.7753],
        [-2.0702, -2.7731, -1.9529,  0.5967,  1.8788,  0.6254]],
       device='cuda:0')
action: tensor([[ 0.9917,  0.0404,  0.9171,  0.5218,  0.3984,  0.7564],
        [ 0.9537,  0.6773,  0.9209, -0.1470, -0.9476, -0.9508],
        [ 0.9342,  0.0280, -0.6401,  0.1373, -0.8810, -0.6785],
        [-0.9949, -0.9922, -0.9196,  0.3456,  0.9361, -0.8993],
        [-0.9897, -0.9821, -0.9349, -0.9248,  0.9758,  0.6693],
        [-0.5563,  0.9893, -0.8519, -0.9707,  0.3866, -0.6506],
        [ 0.9848, -0.6730,  0.9899, -0.3359, -0.9668, -0.9861],
        [ 0.9845,  0.2984,  0.9677,  0.1408, -0.9778, -0.9698],
        [ 0.7092, -0.3010, -0.9703,  0.9208, -0.1408, -0.0467],
        [-0.9887, -0.9831, -0.9688,  0.9807,  0.9754,  0.9678],
        [-0.9187, -0.7301, -0.8073,  0.1246,  0.9250,  0.2460],
        [ 0.8089,  0.5325, -0.8275, -0.4685,  0.2318,  0.7342],
        [ 0.8905, -0.0708,  0.9441,  0.6520, -0.0274,  0.8059],
        [-0.9620,  0.8048, -0.9423,  0.0048, -0.3401,  0.5114],
        [ 0.8048,  0.9852, -0.9864, -0.9309,  0.4530,  0.7710],
        [ 0.9578, -0.5400,  0.9962, -0.9179, -0.9108, -0.9171],
        [ 0.9974,  0.6601, -0.9475,  0.6814, -0.9703, -0.9818],
        [-0.9814, -0.8726, -0.9802,  0.1362,  0.9626,  0.9496],
        [-0.9377, -0.9313, -0.9893, -0.7893,  0.9806,  0.9402],
        [ 0.8752,  0.7299, -0.7725,  0.1445,  0.8480,  0.3700]],
       device='cuda:0')
squash tensor([[ 2.7402,  0.0404,  1.5704,  0.5788,  0.4218,  0.9877],
        [ 1.8715,  0.8242,  1.5952, -0.1481, -1.8075, -1.8402],
        [ 1.6903,  0.0280, -0.7583,  0.1382, -1.3801, -0.8263],
        [-2.9894, -2.7695, -1.5866,  0.3605,  1.7054, -1.4686],
        [-2.6321, -2.3548, -1.6962, -1.6215,  2.2008,  0.8095],
        [-0.6275,  2.6136, -1.2630, -2.1039,  0.4077, -0.7764],
        [ 2.4348, -0.8162,  2.6437, -0.3494, -2.0412, -2.4797],
        [ 2.4265,  0.3078,  2.0555,  0.1418, -2.2452, -2.0886],
        [ 0.8855, -0.3106, -2.0968,  1.5943, -0.1418, -0.0468],
        [-2.5837, -2.3836, -2.0718,  2.3167,  2.1922,  2.0563],
        [-1.5805, -0.9289, -1.1193,  0.1253,  1.6225,  0.2511],
        [ 1.1239,  0.5936, -1.1803, -0.5082,  0.2361,  0.9377],
        [ 1.4242, -0.0709,  1.7743,  0.7788, -0.0274,  1.1154],
        [-1.9721,  1.1121, -1.7577,  0.0048, -0.3542,  0.5646],
        [ 1.1120,  2.4491, -2.4923, -1.6650,  0.4884,  1.0228],
        [ 1.9187, -0.6042,  3.1363, -1.5758, -1.5322, -1.5704],
        [ 3.3178,  0.7930, -1.8064,  0.8317, -2.0977, -2.3439],
        [-2.3348, -1.3437, -2.3022,  0.1371,  1.9803,  1.8274],
        [-1.7188, -1.6678, -2.6135, -1.0696,  2.3117,  1.7399],
        [ 1.3550,  0.9285, -1.0265,  0.1455,  1.2492,  0.3884]],
       device='cuda:0')
action: tensor([[ 9.8999e-01, -4.9408e-01,  9.9163e-01, -9.8263e-01, -8.6520e-01,
         -7.0224e-01],
        [ 9.9630e-01,  3.8427e-01, -6.4166e-01,  2.6776e-01, -9.9559e-01,
         -9.6889e-01],
        [-9.7189e-01, -9.7713e-01, -8.8413e-01,  2.9207e-01,  9.7882e-01,
          8.1661e-01],
        [-9.7980e-01, -9.9410e-01, -9.7383e-01, -3.6024e-01,  9.2834e-01,
          1.8689e-01],
        [ 7.8596e-01,  5.7710e-01, -7.6949e-01,  3.9562e-02,  6.3769e-01,
         -3.1119e-01],
        [ 9.9673e-01, -2.5240e-01,  9.9040e-01, -3.8773e-01, -9.0776e-01,
          1.3117e-01],
        [ 9.6752e-01, -4.4533e-01,  9.8101e-01, -2.6692e-02, -8.4191e-01,
         -7.0436e-01],
        [ 9.8612e-01,  8.3057e-02,  7.4018e-01,  9.0371e-01, -9.6001e-01,
         -7.5224e-01],
        [ 9.6807e-01, -1.3316e-01, -5.5015e-01,  4.1526e-01, -9.0563e-01,
         -9.7927e-01],
        [-9.9698e-01, -9.8235e-01, -9.5367e-01,  5.2823e-01,  9.9450e-01,
         -1.1662e-01],
        [-9.5012e-01, -9.7093e-01, -9.3012e-01, -7.7744e-01,  8.8060e-01,
          4.7258e-01],
        [-3.2914e-02,  6.8173e-01, -9.4223e-01, -4.0446e-01, -7.6529e-02,
         -6.2150e-01],
        [ 9.6168e-01,  2.4048e-02,  9.9089e-01,  8.1052e-01, -9.5271e-01,
         -7.9732e-01],
        [ 9.9688e-01,  6.9408e-01,  9.1196e-01,  2.4141e-01, -9.1124e-01,
          7.7711e-01],
        [ 9.8024e-01,  1.0302e-01, -9.3123e-01,  9.0908e-01, -9.5230e-01,
          2.2035e-01],
        [-9.9550e-01, -9.8679e-01, -7.5420e-01,  7.9574e-01,  9.0190e-01,
          6.4938e-01],
        [-9.8887e-01, -9.5333e-01, -9.5073e-01, -4.9387e-01,  9.7947e-01,
          9.5286e-01],
        [ 7.7783e-01,  8.6795e-01, -9.0731e-01, -1.3269e-01,  3.3032e-01,
          6.9190e-01],
        [ 9.5884e-01, -7.6816e-01,  9.9568e-01,  6.1389e-01, -8.5655e-01,
         -9.0143e-04],
        [ 9.8860e-01,  5.1274e-01,  7.6709e-01, -3.4473e-02, -9.1651e-01,
         -3.8047e-01]], device='cuda:0')
squash tensor([[ 2.6461e+00, -5.4145e-01,  2.7357e+00, -2.3686e+00, -1.3137e+00,
         -8.7171e-01],
        [ 3.1454e+00,  4.0505e-01, -7.6100e-01,  2.7445e-01, -3.0569e+00,
         -2.0739e+00],
        [-2.1254e+00, -2.2298e+00, -1.3944e+00,  3.0082e-01,  2.2685e+00,
          1.1465e+00],
        [-2.2926e+00, -2.9115e+00, -2.1616e+00, -3.7716e-01,  1.6462e+00,
          1.8911e-01],
        [ 1.0608e+00,  6.5810e-01, -1.0191e+00,  3.9582e-02,  7.5427e-01,
         -3.2187e-01],
        [ 3.2075e+00, -2.5797e-01,  2.6672e+00, -4.0912e-01, -1.5147e+00,
          1.3193e-01],
        [ 2.0519e+00, -4.7886e-01,  2.3238e+00, -2.6698e-02, -1.2277e+00,
         -8.7590e-01],
        [ 2.4817e+00,  8.3248e-02,  9.5088e-01,  1.4921e+00, -1.9460e+00,
         -9.7809e-01],
        [ 2.0606e+00, -1.3395e-01, -6.1859e-01,  4.4195e-01, -1.5027e+00,
         -2.2794e+00],
        [-3.2478e+00, -2.3606e+00, -1.8708e+00,  5.8768e-01,  2.9464e+00,
         -1.1715e-01],
        [-1.8330e+00, -2.1083e+00, -1.6593e+00, -1.0389e+00,  1.3784e+00,
          5.1339e-01],
        [-3.2926e-02,  8.3233e-01, -1.7576e+00, -4.2897e-01, -7.6679e-02,
         -7.2744e-01],
        [ 1.9678e+00,  2.4053e-02,  2.6933e+00,  1.1285e+00, -1.8603e+00,
         -1.0912e+00],
        [ 3.2313e+00,  8.5579e-01,  1.5390e+00,  2.4627e-01, -1.5348e+00,
          1.0380e+00],
        [ 2.3037e+00,  1.0339e-01, -1.6676e+00,  1.5222e+00, -1.8559e+00,
          2.2402e-01],
        [-3.0468e+00, -2.5068e+00, -9.8262e-01,  1.0869e+00,  1.4823e+00,
          7.7422e-01],
        [-2.5926e+00, -1.8671e+00, -1.8393e+00, -5.4117e-01,  2.2843e+00,
          1.8620e+00],
        [ 1.0399e+00,  1.3247e+00, -1.5121e+00, -1.3348e-01,  3.4319e-01,
          8.5159e-01],
        [ 1.9314e+00, -1.0158e+00,  3.0674e+00,  7.1514e-01, -1.2802e+00,
         -9.0143e-04],
        [ 2.5809e+00,  5.6645e-01,  1.0132e+00, -3.4487e-02, -1.5667e+00,
         -4.0061e-01]], device='cuda:0')
action: tensor([[-0.9616, -0.9564, -0.9748,  0.5252,  0.9928,  0.7625],
        [-0.9402, -0.9801, -0.9665, -0.3488,  0.9763,  0.9858],
        [ 0.9169,  0.4747, -0.8117,  0.4485,  0.7745,  0.7960],
        [ 0.9640, -0.4271,  0.9580,  0.2756, -0.9320, -0.7548],
        [ 0.9660, -0.4319,  0.9895, -0.0011, -0.8695, -0.7762],
        [ 0.9975,  0.1131,  0.8827,  0.7220, -0.9696, -0.9109],
        [ 0.6441,  0.0118, -0.7665,  0.2495, -0.9717, -0.9887],
        [-0.9846, -0.9885, -0.9725,  0.8204,  0.9571,  0.7540],
        [-0.9344, -0.9726, -0.9692, -0.8782,  0.9686,  0.8791],
        [ 0.2814,  0.7175, -0.9634, -0.1055, -0.2955,  0.0749],
        [ 0.9726,  0.4635,  0.9185,  0.6927, -0.8886, -0.6083],
        [ 0.9592,  0.6862,  0.9861,  0.1952, -0.9735,  0.0737],
        [ 0.9747,  0.2417, -0.5899,  0.8356, -0.8725, -0.9114],
        [-0.9953, -0.8557, -0.9420,  0.6299,  0.9112,  0.7880],
        [-0.8865, -0.9748, -0.9623, -0.6667,  0.5480,  0.7237],
        [ 0.8852,  0.6343, -0.9871, -0.5017,  0.8104,  0.2312],
        [ 0.9928, -0.8833,  0.9842,  0.3179, -0.5363,  0.2989],
        [ 0.9152, -0.3733,  0.9485,  0.7747, -0.8352, -0.3554],
        [ 0.8644, -0.9578, -0.5479,  0.8956, -0.7808, -0.7645],
        [-0.9952, -0.9508, -0.9496,  0.8353,  0.9576, -0.8084]],
       device='cuda:0')
squash tensor([[-1.9662e+00, -1.9021e+00, -2.1810e+00,  5.8353e-01,  2.8105e+00,
          1.0021e+00],
        [-1.7396e+00, -2.2999e+00, -2.0357e+00, -3.6407e-01,  2.2124e+00,
          2.4691e+00],
        [ 1.5695e+00,  5.1610e-01, -1.1320e+00,  4.8288e-01,  1.0314e+00,
          1.0876e+00],
        [ 2.0000e+00, -4.5631e-01,  1.9212e+00,  2.8293e-01, -1.6731e+00,
         -9.8395e-01],
        [ 2.0281e+00, -4.6225e-01,  2.6203e+00, -1.0646e-03, -1.3311e+00,
         -1.0357e+00],
        [ 3.3508e+00,  1.1360e-01,  1.3879e+00,  9.1181e-01, -2.0855e+00,
         -1.5330e+00],
        [ 7.6519e-01,  1.1778e-02, -1.0119e+00,  2.5486e-01, -2.1211e+00,
         -2.5859e+00],
        [-2.4296e+00, -2.5783e+00, -2.1362e+00,  1.1580e+00,  1.9101e+00,
          9.8205e-01],
        [-1.6917e+00, -2.1391e+00, -2.0784e+00, -1.3677e+00,  2.0698e+00,
          1.3717e+00],
        [ 2.8915e-01,  9.0237e-01, -1.9910e+00, -1.0588e-01, -3.0460e-01,
          7.5006e-02],
        [ 2.1374e+00,  5.0179e-01,  1.5796e+00,  8.5305e-01, -1.4152e+00,
         -7.0622e-01],
        [ 1.9353e+00,  8.4075e-01,  2.4806e+00,  1.9772e-01, -2.1555e+00,
          7.3877e-02],
        [ 2.1788e+00,  2.4659e-01, -6.7751e-01,  1.2063e+00, -1.3437e+00,
         -1.5355e+00],
        [-3.0255e+00, -1.2771e+00, -1.7557e+00,  7.4117e-01,  1.5345e+00,
          1.0661e+00],
        [-1.4053e+00, -2.1800e+00, -1.9767e+00, -8.0473e-01,  6.1545e-01,
          9.1534e-01],
        [ 1.3991e+00,  7.4861e-01, -2.5192e+00, -5.5158e-01,  1.1282e+00,
          2.3550e-01],
        [ 2.8147e+00, -1.3906e+00,  2.4165e+00,  3.2927e-01, -5.9893e-01,
          3.0829e-01],
        [ 1.5584e+00, -3.9224e-01,  1.8171e+00,  1.0319e+00, -1.2052e+00,
         -3.7161e-01],
        [ 1.3106e+00, -1.9186e+00, -6.1543e-01,  1.4496e+00, -1.0475e+00,
         -1.0070e+00],
        [-3.0132e+00, -1.8405e+00, -1.8275e+00,  1.2055e+00,  1.9161e+00,
         -1.1223e+00]], device='cuda:0')
action: tensor([[ 0.9859, -0.1495, -0.9387,  0.9756, -0.9487,  0.4271],
        [-0.9914, -0.9613, -0.9200,  0.9071,  0.9557,  0.8875],
        [-0.9942, -0.9874, -0.9460, -0.1933,  0.1951,  0.5651],
        [ 0.2424,  0.6980, -0.9554, -0.7473,  0.0935,  0.1305],
        [ 0.9875,  0.2215,  0.9241,  0.7434, -0.8427,  0.1339],
        [ 0.9935,  0.3653,  0.9625,  0.1077, -0.7018, -0.7875],
        [ 0.9734,  0.3868,  0.9883, -0.0098, -0.9616, -0.7895],
        [ 0.9877, -0.1320, -0.5962,  0.2531, -0.9384, -0.9611],
        [-0.9768, -0.9464, -0.8849,  0.1054,  0.9657, -0.9171],
        [-0.9609, -0.9746, -0.9693, -0.5113,  0.9830,  0.9427],
        [ 0.9239,  0.6298, -0.8286, -0.7957,  0.8516,  0.7019],
        [ 0.9609, -0.2255,  0.9635,  0.0836, -0.9391, -0.3891],
        [ 0.9694,  0.1389,  0.9272,  0.7578, -0.9500,  0.2421],
        [ 0.9356, -0.4162,  0.1192,  0.9717, -0.9779,  0.8589],
        [-0.9932, -0.9413, -0.9399,  0.6588,  0.9542, -0.0218],
        [-0.9885, -0.9777, -0.9516, -0.4093,  0.9389,  0.8889],
        [ 0.8425,  0.3710, -0.2425, -0.0097,  0.3649,  0.8197],
        [ 0.9286, -0.1676,  0.9492,  0.5794, -0.9708, -0.9137],
        [ 0.9617,  0.7336,  0.9669,  0.7140, -0.8695, -0.7188],
        [ 0.9919,  0.2443, -0.9671,  0.9698, -0.5539,  0.8855]],
       device='cuda:0')
squash tensor([[ 2.4727, -0.1507, -1.7268,  2.1971, -1.8183,  0.4563],
        [-2.7198, -1.9630, -1.5893,  1.5107,  1.8935,  1.4102],
        [-2.9171, -2.5307, -1.7922, -0.1957,  0.1976,  0.6403],
        [ 0.2473,  0.8633, -1.8898, -0.9668,  0.0937,  0.1313],
        [ 2.5331,  0.2252,  1.6164,  0.9581, -1.2304,  0.1347],
        [ 2.8600,  0.3830,  1.9785,  0.1081, -0.8708, -1.0648],
        [ 2.1528,  0.4081,  2.5686, -0.0098, -1.9669, -1.0702],
        [ 2.5424, -0.1328, -0.6872,  0.2587, -1.7243, -1.9595],
        [-2.2222, -1.7961, -1.3979,  0.1058,  2.0236, -1.5704],
        [-1.9577, -2.1772, -2.0813, -0.5645,  2.3803,  1.7618],
        [ 1.6151,  0.7411, -1.1835, -1.0868,  1.2618,  0.8711],
        [ 1.9579, -0.2294,  1.9930,  0.0837, -1.7305, -0.4107],
        [ 2.0822,  0.1398,  1.6380,  0.9910, -1.8323,  0.2470],
        [ 1.7012, -0.4431,  0.1197,  2.1227, -2.2465,  1.2890],
        [-2.8373, -1.7495, -1.7372,  0.7907,  1.8769, -0.0218],
        [-2.5780, -2.2427, -1.8482, -0.4348,  1.7291,  1.4168],
        [ 1.2299,  0.3896, -0.2474, -0.0097,  0.3826,  1.1558],
        [ 1.6481, -0.1692,  1.8239,  0.6616, -2.1064, -1.5492],
        [ 1.9685,  0.9365,  2.0425,  0.8953, -1.3309, -0.9052],
        [ 2.7547,  0.2494, -2.0452,  2.0885, -0.6239,  1.4006]],
       device='cuda:0')
action: tensor([[ 0.9985, -0.3619,  0.9931,  0.5008, -0.5471,  0.8936],
        [ 0.9632, -0.6731,  0.9937,  0.4782, -0.8386, -0.1232],
        [ 0.3980, -0.9369, -0.6837,  0.9824, -0.6569, -0.9463],
        [-0.9903, -0.9970, -0.9801,  0.5291,  0.8403, -0.6932],
        [-0.9011, -0.9900, -0.7878, -0.8923,  0.8028,  0.6016],
        [ 0.6042,  0.8477,  0.0351, -0.5945, -0.4988, -0.3035],
        [ 0.9940,  0.1905,  0.9317,  0.3033, -0.9592, -0.8750],
        [ 0.9911,  0.8001,  0.9654,  0.6989, -0.9460, -0.5362],
        [ 0.9919,  0.0738, -0.7125,  0.9049, -0.9214,  0.2169],
        [-0.9983, -0.9537, -0.9240,  0.9767,  0.9879,  0.9653],
        [-0.9861, -0.9135, -0.9772,  0.0681,  0.7532,  0.6425],
        [ 0.9535,  0.3311, -0.9360, -0.0117,  0.4843,  0.5486],
        [ 0.9679,  0.6647,  0.9641,  0.6885, -0.5728, -0.1760],
        [-0.9384,  0.9794, -0.9834,  0.1348, -0.1910,  0.8299],
        [ 0.9510,  0.7394, -0.9096, -0.8443, -0.3471,  0.0903],
        [ 0.9976, -0.4773,  0.9827, -0.9785, -0.9603, -0.9732],
        [ 0.9944,  0.6238, -0.8311,  0.3830, -0.9409, -0.7983],
        [-0.9877, -0.8996, -0.9609,  0.5991,  0.9406,  0.9416],
        [-0.9783, -0.9584, -0.9826, -0.8665,  0.9742,  0.9561],
        [ 0.8259,  0.8014, -0.8061,  0.2215,  0.9032,  0.3782]],
       device='cuda:0')
squash tensor([[ 3.6008, -0.3790,  2.8311,  0.5504, -0.6143,  1.4394],
        [ 1.9877, -0.8164,  2.8747,  0.5206, -1.2164, -0.1239],
        [ 0.4212, -1.7117, -0.8361,  2.3608, -0.7874, -1.7953],
        [-2.6638, -3.2534, -2.3006,  0.5889,  1.2223, -0.8541],
        [-1.4778, -2.6461, -1.0657, -1.4331,  1.1065,  0.6957],
        [ 0.6998,  1.2478,  0.0352, -0.6847, -0.5477, -0.3133],
        [ 2.9009,  0.1929,  1.6708,  0.3132, -1.9362, -1.3539],
        [ 2.7037,  1.0988,  2.0191,  0.8651, -1.7919, -0.5988],
        [ 2.7513,  0.0739, -0.8923,  1.4986, -1.5983,  0.2203],
        [-3.5272, -1.8716, -1.6154,  2.2203,  2.5517,  2.0180],
        [-2.4822, -1.5483, -2.2323,  0.0682,  0.9803,  0.7624],
        [ 1.8695,  0.3440, -1.7045, -0.0117,  0.5286,  0.6164],
        [ 2.0583,  0.8012,  2.0007,  0.8452, -0.6516, -0.1778],
        [-1.7246,  2.2831, -2.3930,  0.1357, -0.1934,  1.1877],
        [ 1.8423,  0.9491, -1.5249, -1.2359, -0.3621,  0.0905],
        [ 3.3622, -0.5195,  2.3699, -2.2620, -1.9492, -2.1503],
        [ 2.9400,  0.7312, -1.1916,  0.4036, -1.7459, -1.0939],
        [-2.5413, -1.4699, -1.9569,  0.6918,  1.7433,  1.7520],
        [-2.2562, -1.9257, -2.3665, -1.3190,  2.1692,  1.8988],
        [ 1.1752,  1.1025, -1.1157,  0.2252,  1.4893,  0.3980]],
       device='cuda:0')
action: tensor([[-0.9534, -0.9887, -0.8014, -0.2822,  0.9739,  0.7012],
        [ 0.8513,  0.4005, -0.6913, -0.0803,  0.7011,  0.5865],
        [ 0.9605, -0.3662,  0.9968,  0.3762, -0.9362, -0.4315],
        [ 0.9944, -0.5292,  0.9374,  0.7812, -0.9421, -0.2552],
        [ 0.6487, -0.8766, -0.8307,  0.9848, -0.7747, -0.6062],
        [-0.9814, -0.9675, -0.8890,  0.9897,  0.9393,  0.7716],
        [-0.9617, -0.9805, -0.9926, -0.3401,  0.9557,  0.6054],
        [ 0.0924,  0.7647, -0.9979, -0.9018,  0.3099,  0.6227],
        [ 0.8854,  0.6670,  0.9845,  0.6486, -0.0804, -0.9210],
        [-0.9948,  0.9352, -0.8258, -0.5611, -0.3923,  0.1334],
        [ 0.4043,  0.9229, -0.9630, -0.8839, -0.2907, -0.1381],
        [ 0.9851, -0.6116,  0.9547, -0.9877, -0.9754, -0.9509],
        [ 0.9969,  0.7116, -0.7433, -0.0143, -0.9790, -0.9619],
        [-0.9824, -0.9356, -0.9670,  0.8492,  0.9560,  0.9817],
        [-0.9867, -0.9899, -0.9233, -0.9125,  0.9273,  0.8838],
        [ 0.8243,  0.3190,  0.1903,  0.8985,  0.9340,  0.3257],
        [ 0.9785, -0.3301,  0.9795, -0.0425, -0.7790, -0.6744],
        [ 0.9754, -0.3357,  0.9529, -0.4635, -0.9543, -0.8795],
        [ 0.9918,  0.5007,  0.8843,  0.3792, -0.9659, -0.9508],
        [ 0.9786,  0.7380, -0.8976,  0.4355, -0.9910, -0.8066]],
       device='cuda:0')
squash tensor([[-1.8674, -2.5856, -1.1026, -0.2900,  2.1627,  0.8696],
        [ 1.2610,  0.4243, -0.8505, -0.0805,  0.8695,  0.6724],
        [ 1.9525, -0.3840,  3.2179,  0.3956, -1.7067, -0.4617],
        [ 2.9421, -0.5891,  1.7159,  1.0484, -1.7561, -0.2610],
        [ 0.7731, -1.3607, -1.1904,  2.4361, -1.0319, -0.7028],
        [-2.3355, -2.0513, -1.4169,  2.6304,  1.7321,  1.0244],
        [-1.9686, -2.3095, -2.7965, -0.3542,  1.8942,  0.7017],
        [ 0.0927,  1.0075, -3.4372, -1.4818,  0.3205,  0.7294],
        [ 1.4003,  0.8054,  2.4251,  0.7729, -0.0805, -1.5958],
        [-2.9794,  1.6982, -1.1748, -0.6345, -0.4146,  0.1342],
        [ 0.4288,  1.6084, -1.9854, -1.3932, -0.2993, -0.1390],
        [ 2.4466, -0.7114,  1.8824, -2.5425, -2.1934, -1.8413],
        [ 3.2335,  0.8903, -0.9577, -0.0143, -2.2731, -1.9704],
        [-2.3610, -1.7015, -2.0444,  1.2534,  1.8975,  2.3434],
        [-2.5040, -2.6396, -1.6106, -1.5423,  1.6389,  1.3930],
        [ 1.1702,  0.3306,  0.1926,  1.4643,  1.6886,  0.3381],
        [ 2.2609, -0.3430,  2.2840, -0.0425, -1.0429, -0.8187],
        [ 2.1929, -0.3493,  1.8619, -0.5018, -1.8774, -1.3736],
        [ 2.7441,  0.5502,  1.3953,  0.3992, -2.0278, -1.8401],
        [ 2.2633,  0.9460, -1.4597,  0.4666, -2.7009, -1.1173]],
       device='cuda:0')
action: tensor([[-0.9867, -0.7633, -0.9822,  0.9619,  0.9795,  0.9974],
        [-0.9932, -0.9870, -0.9913,  0.0762,  0.9478,  0.9313],
        [ 0.9059,  0.6084, -0.7913, -0.8926,  0.4081, -0.6579],
        [ 0.9797,  0.3140,  0.9841,  0.8866, -0.8980,  0.9810],
        [-0.9979,  0.7932, -0.7803, -0.2761, -0.3978,  0.0912],
        [ 0.8411,  0.8540, -0.9308, -0.7181,  0.3590, -0.2622],
        [ 0.9949, -0.4234,  0.9841, -0.9167, -0.8102, -0.5507],
        [ 0.9996,  0.8100, -0.6514,  0.2284, -0.8560, -0.9812],
        [-0.9647, -0.8000, -0.8878,  0.2942,  0.7347,  0.8867],
        [-0.9755, -0.9399, -0.9753, -0.1634,  0.9861,  0.8149],
        [ 0.9727,  0.3262, -0.4742,  0.3427,  0.3855,  0.4564],
        [ 0.9869, -0.5250,  0.9771,  0.1432, -0.9193, -0.7908],
        [ 0.9950, -0.6918,  0.9985,  0.1947, -0.9247, -0.3818],
        [ 0.9999,  0.1466,  0.8660,  0.6206, -0.9558, -0.9952],
        [ 0.9740, -0.5295, -0.8278,  0.7096, -0.8418, -0.8675],
        [-0.9902, -0.9923, -0.9581,  0.3784,  0.9571,  0.6108],
        [-0.9813, -0.9914, -0.8882, -0.6524,  0.9311,  0.9284],
        [ 0.1169,  0.7707, -0.7015,  0.0811,  0.4238,  0.2944],
        [ 0.9711, -0.1152,  0.9917,  0.3910, -0.4644, -0.8042],
        [ 0.9821,  0.2019,  0.9660, -0.2812, -0.9288, -0.9588]],
       device='cuda:0')
squash tensor([[-2.5044, -1.0041, -2.3564,  1.9701,  2.2841,  3.3206],
        [-2.8400, -2.5129, -2.7182,  0.0764,  1.8097,  1.6680],
        [ 1.5042,  0.7064, -1.0749, -1.4346,  0.4334, -0.7890],
        [ 2.2894,  0.3250,  2.4117,  1.4056, -1.4620,  2.3228],
        [-3.4322,  1.0799, -1.0462, -0.2835, -0.4210,  0.0914],
        [ 1.2250,  1.2709, -1.6645, -0.9037,  0.3757, -0.2684],
        [ 2.9854, -0.4518,  2.4137, -1.5677, -1.1275, -0.6194],
        [ 4.2849,  1.1269, -0.7777,  0.2325, -1.2781, -2.3301],
        [-2.0098, -1.0986, -1.4116,  0.3032,  0.9390,  1.4064],
        [-2.1944, -1.7368, -2.1902, -0.1649,  2.4793,  1.1416],
        [ 2.1406,  0.3386, -0.5155,  0.3572,  0.4065,  0.4927],
        [ 2.5092, -0.5832,  2.2288,  0.1442, -1.5846, -1.0737],
        [ 2.9963, -0.8513,  3.6043,  0.1972, -1.6206, -0.4022],
        [ 4.8729,  0.1477,  1.3170,  0.7260, -1.8945, -3.0141],
        [ 2.1651, -0.5894, -1.1811,  0.8863, -1.2272, -1.3231],
        [-2.6570, -2.7775, -1.9220,  0.3982,  1.9097,  0.7102],
        [-2.3303, -2.7196, -1.4135, -0.7794,  1.6668,  1.6464],
        [ 0.1174,  1.0220, -0.8702,  0.0813,  0.4524,  0.3034],
        [ 2.1111, -0.1158,  2.7394,  0.4130, -0.5029, -1.1104],
        [ 2.3532,  0.2047,  2.0293, -0.2889, -1.6498, -1.9306]],
       device='cuda:0')
action: tensor([[ 0.9944,  0.7314,  0.9814,  0.7351, -0.9303, -0.8757],
        [ 0.4411, -0.5871,  0.8184,  0.9197, -0.8504, -0.8072],
        [-0.5725, -0.2908, -0.8715,  0.9944, -0.9337, -0.9008],
        [-0.9939, -0.9913, -0.8660,  0.9966,  0.8744, -0.2062],
        [-0.9797, -0.8922, -0.8817,  0.5946,  0.9782,  0.8296],
        [ 0.6432,  0.9604, -0.9762, -0.5105,  0.2839, -0.5482],
        [ 0.9387,  0.9398,  0.5952,  0.1817, -0.8835, -0.8599],
        [-0.9760,  0.9376, -0.8282, -0.3017, -0.3162,  0.9535],
        [ 0.7515,  0.8360, -0.9408, -0.7654,  0.3945,  0.3552],
        [ 0.9847, -0.9545,  0.9769, -0.9738, -0.9200, -0.9330],
        [ 0.9242,  0.2242, -0.5974,  0.5468, -0.8998, -0.6349],
        [-0.9956, -0.9804, -0.9951,  0.7021,  0.9782,  0.8717],
        [-0.9723, -0.9601, -0.8172, -0.5615,  0.9907,  0.9338],
        [ 0.9154,  0.2631, -0.4645,  0.8237,  0.7255,  0.2546],
        [ 0.9875, -0.2902,  0.9694,  0.2382, -0.7807, -0.8238],
        [ 0.9756, -0.6205,  0.9344,  0.8064, -0.8116, -0.1330],
        [ 0.4389, -0.8833, -0.5876,  0.8665, -0.9063, -0.4454],
        [-0.9954, -0.8837, -0.8458,  0.9868,  0.9331,  0.2120],
        [-0.9259, -0.9823, -0.9591,  0.0858,  0.9081,  0.8475],
        [-0.0899,  0.8339, -0.9586, -0.8267,  0.2940, -0.1529]],
       device='cuda:0')
squash tensor([[ 2.9384,  0.9317,  2.3342,  0.9397, -1.6609, -1.3569],
        [ 0.4736, -0.6732,  1.1519,  1.5872, -1.2576, -1.1188],
        [-0.6512, -0.2994, -1.3391,  2.9417, -1.6867, -1.4767],
        [-2.8964, -2.7184, -1.3169,  3.1950,  1.3515, -0.2092],
        [-2.2897, -1.4326, -1.3833,  0.6848,  2.2538,  1.1867],
        [ 0.7637,  1.9514, -2.2096, -0.5634,  0.2920, -0.6158],
        [ 1.7270,  1.7365,  0.6857,  0.1837, -1.3917, -1.2929],
        [-2.2053,  1.7180, -1.1823, -0.3114, -0.3274,  1.8693],
        [ 0.9763,  1.2077, -1.7453, -1.0091,  0.4172,  0.3714],
        [ 2.4327, -1.8796,  2.2248, -2.1601, -1.5888, -1.6812],
        [ 1.6171,  0.2281, -0.6892,  0.6139, -1.4709, -0.7495],
        [-3.0564, -2.3076, -2.9995,  0.8715,  2.2544,  1.3402],
        [-2.1335, -1.9476, -1.1483, -0.6350,  2.6820,  1.6873],
        [ 1.5600,  0.2695, -0.5030,  1.1681,  0.9192,  0.2603],
        [ 2.5354, -0.2987,  2.0828,  0.2429, -1.0472, -1.1686],
        [ 2.1968, -0.7259,  1.6923,  1.1167, -1.1317, -0.1337],
        [ 0.4708, -1.3905, -0.6740,  1.3188, -1.5063, -0.4790],
        [-3.0324, -1.3926, -1.2413,  2.5086,  1.6819,  0.2152],
        [-1.6285, -2.3585, -1.9341,  0.0860,  1.5165,  1.2472],
        [-0.0901,  1.2008, -1.9289, -1.1777,  0.3029, -0.1541]],
       device='cuda:0')
action: tensor([[ 0.9828,  0.6715,  0.7411,  0.2915, -0.9507, -0.6236],
        [ 0.8239,  0.3132, -0.9199,  0.7917, -0.9858, -0.4900],
        [-0.9876, -0.9553, -0.9612,  0.7156,  0.9981,  0.9876],
        [-0.9823, -0.8540, -0.9765,  0.1792,  0.9457, -0.0048],
        [ 0.9686,  0.2869, -0.8979, -0.0533,  0.6210, -0.3646],
        [ 0.9888, -0.4651,  0.9805,  0.6864, -0.8868, -0.1902],
        [ 0.9812, -0.1665,  0.9982, -0.1866, -0.9021, -0.1191],
        [ 0.9987,  0.4984,  0.9651,  0.4494, -0.9703, -0.8614],
        [ 0.9344,  0.4666, -0.8792,  0.2143, -0.9467, -0.8626],
        [-0.9971, -0.9118, -0.8779,  0.1911,  0.9867,  0.1366],
        [-0.9649, -0.9939, -0.9562, -0.5342,  0.9754,  0.8926],
        [ 0.9838,  0.4902, -0.9649, -0.5083,  0.5991,  0.5572],
        [ 0.9481, -0.3618,  0.9817,  0.0731, -0.9165,  0.4807],
        [ 0.9665, -0.0318,  0.9881,  0.5618, -0.8906, -0.8630],
        [ 0.6396, -0.3376, -0.5105,  0.9115, -0.9413, -0.9585],
        [-0.9740, -0.8673, -0.8924,  0.4112,  0.9716,  0.2642],
        [-0.9667, -0.9475, -0.9218, -0.3684,  0.9775,  0.3519],
        [ 0.7717, -0.1694, -0.7365,  0.0906,  0.8751,  0.3602],
        [ 0.9865, -0.0228,  0.9926,  0.3649, -0.9351, -0.8978],
        [ 0.9558, -0.3331,  0.9968, -0.1169, -0.9724, -0.7461]],
       device='cuda:0')
squash tensor([[ 2.3733,  0.8134,  0.9529,  0.3002, -1.8392, -0.7308],
        [ 1.1688,  0.3240, -1.5882,  1.0761, -2.4696, -0.5361],
        [-2.5404, -1.8895, -1.9614,  0.8985,  3.4765,  2.5374],
        [-2.3601, -1.2709, -2.2171,  0.1812,  1.7896, -0.0048],
        [ 2.0690,  0.2952, -1.4615, -0.0533,  0.7267, -0.3822],
        [ 2.5895, -0.5038,  2.3093,  0.8412, -1.4066, -0.1925],
        [ 2.3292, -0.1681,  3.5154, -0.1888, -1.4835, -0.1197],
        [ 3.6673,  0.5471,  2.0157,  0.4839, -2.0969, -1.2989],
        [ 1.6918,  0.5057, -1.3721,  0.2176, -1.7987, -1.3034],
        [-3.2741, -1.5380, -1.3666,  0.1935,  2.5026,  0.1375],
        [-2.0124, -2.8936, -1.8997, -0.5960,  2.1923,  1.4344],
        [ 2.4049,  0.5363, -2.0131, -0.5604,  0.6917,  0.6288],
        [ 1.8127, -0.3790,  2.3434,  0.0732, -1.5669,  0.5239],
        [ 2.0368, -0.0318,  2.5578,  0.6354, -1.4250, -1.3050],
        [ 0.7575, -0.3513, -0.5634,  1.5362, -1.7496, -1.9266],
        [-2.1641, -1.3220, -1.4334,  0.4370,  2.1209,  0.2706],
        [-2.0395, -1.8064, -1.6010, -0.3866,  2.2382,  0.3676],
        [ 1.0246, -0.1710, -0.9427,  0.0909,  1.3543,  0.3771],
        [ 2.4958, -0.0228,  2.7950,  0.3826, -1.6976, -1.4608],
        [ 1.8946, -0.3463,  3.2215, -0.1174, -2.1354, -0.9642]],
       device='cuda:0')
action: tensor([[ 0.9600,  0.1015, -0.4321,  0.9041, -0.9810, -0.4358],
        [-0.9871, -0.8619, -0.8568,  0.9634,  0.9936,  0.9790],
        [-0.9981, -0.9536, -0.9436,  0.2319,  0.9504,  0.8784],
        [ 0.9535, -0.0556, -0.9573,  0.5228,  0.8765, -0.2884],
        [ 0.9904,  0.1521,  0.9704,  0.5112, -0.2568,  0.4948],
        [-0.9188, -0.7273, -0.1679,  0.9247, -0.7811, -0.2248],
        [-0.7449,  0.8281, -0.3869, -0.3880, -0.4381,  0.3922],
        [ 0.7097,  0.1784, -0.6573, -0.5929, -0.6197, -0.6505],
        [ 0.9641, -0.7202,  0.8624, -0.9879, -0.9737, -0.9643],
        [ 0.9822, -0.8346, -0.9077,  0.6428, -0.9086, -0.9806],
        [-0.9868, -0.9783, -0.9959,  0.4927,  0.9784,  0.9910],
        [-0.9386, -0.9840, -0.9951, -0.7938,  0.9657,  0.9750],
        [ 0.9289,  0.1530,  0.6622,  0.9230,  0.9174,  0.6951],
        [ 0.8862,  0.7383,  0.8657,  0.5826, -0.9784, -0.9192],
        [ 0.8253, -0.2646,  0.3741,  0.9911, -0.9494,  0.1903],
        [-0.3695, -0.9550, -0.9962,  0.9990, -0.7338,  0.1010],
        [-0.9839, -0.9251, -0.9723,  0.9969,  0.9697,  0.9638],
        [-0.7345,  0.9984, -0.9283, -0.9371, -0.9994, -0.6066],
        [ 0.9836,  0.9786, -0.5478, -0.6946, -0.9669,  0.6149],
        [-0.9562, -0.4873, -0.8957,  0.6431,  0.3718, -0.3090]],
       device='cuda:0')
squash tensor([[ 1.9465,  0.1019, -0.4625,  1.4943, -2.3232, -0.4671],
        [-2.5185, -1.3007, -1.2811,  1.9914,  2.8700,  2.2739],
        [-3.4871, -1.8695, -1.7695,  0.2362,  1.8362,  1.3687],
        [ 1.8691, -0.0556, -1.9120,  0.5802,  1.3605, -0.2968],
        [ 2.6652,  0.1532,  2.0985,  0.5643, -0.2627,  0.5424],
        [-1.5813, -0.9230, -0.1695,  1.6204, -1.0482, -0.2287],
        [-0.9614,  1.1821, -0.4082, -0.4095, -0.4699,  0.4143],
        [ 0.8867,  0.1803, -0.7881, -0.6822, -0.7246, -0.7762],
        [ 2.0009, -0.9080,  1.3024, -2.5516, -2.1597, -2.0035],
        [ 2.3576, -1.2032, -1.5145,  0.7630, -1.5195, -2.3124],
        [-2.5083, -2.2574, -3.0956,  0.5396,  2.2596,  2.6990],
        [-1.7260, -2.4105, -3.0036, -1.0817,  2.0237,  2.1846],
        [ 1.6506,  0.1542,  0.7968,  1.6087,  1.5723,  0.8578],
        [ 1.4038,  0.9467,  1.3155,  0.6665, -2.2597, -1.5837],
        [ 1.1733, -0.2710,  0.3932,  2.7046, -1.8253,  0.1927],
        [-0.3878, -1.8863, -3.1359,  3.7859, -0.9369,  0.1014],
        [-2.4085, -1.6231, -2.1330,  3.2340,  2.0874,  1.9961],
        [-0.9384,  3.5609, -1.6458, -1.7133, -4.0935, -0.7035],
        [ 2.3972,  2.2635, -0.6153, -0.8567, -2.0421,  0.7168],
        [-1.8991, -0.5325, -1.4498,  0.7634,  0.3905, -0.3195]],
       device='cuda:0')
action: tensor([[ 0.9683,  0.3922,  0.9770,  0.4502,  0.3981,  0.6167],
        [-0.9483, -0.5850, -0.3818,  0.4808, -0.5790, -0.2298],
        [-0.9518,  0.9451, -0.9329, -0.8445, -0.1440,  0.7308],
        [ 0.8382,  0.9487, -0.8410, -0.7932, -0.5523, -0.5591],
        [ 0.9808, -0.9532,  0.9854, -0.9905, -0.9103, -0.9723],
        [ 0.9842,  0.5138, -0.8538,  0.6506, -0.9899, -0.6699],
        [-0.9968, -0.9879, -0.9484,  0.7099,  0.9738,  0.9541],
        [-0.9938, -0.9541, -0.9840, -0.9288,  0.9197,  0.9926],
        [ 0.9727,  0.2737,  0.5827,  0.4544, -0.7568, -0.9588],
        [ 0.9496,  0.6020,  0.8492,  0.4726, -0.9911, -0.9769],
        [ 0.9947, -0.1872,  0.9712,  0.1658, -0.9993, -0.9825],
        [ 0.8946,  0.4563, -0.7235,  0.1884, -0.9056, -0.2028],
        [-1.0000, -0.8167, -0.9628,  0.8639,  0.9998,  0.9956],
        [-0.9835, -0.9581, -0.8721,  0.3138,  0.9527,  0.8527],
        [-0.8420, -0.9904, -0.5167,  0.9424,  0.8173,  0.8794],
        [ 0.8138, -0.9034,  0.9101,  0.8905,  0.2882,  0.7655],
        [ 0.9393, -0.7894,  0.8578,  0.5624, -0.9471,  0.9793],
        [-0.9959,  0.9949, -0.9823, -0.9719, -0.7756, -0.7975],
        [ 0.3225,  0.9744, -0.9101, -0.9946, -0.8046, -0.8071],
        [ 0.9979, -0.5939,  0.9503, -0.9928, -0.9628, -0.9649]],
       device='cuda:0')
squash tensor([[ 2.0648,  0.4144,  2.2268,  0.4850,  0.4214,  0.7197],
        [-1.8146, -0.6700, -0.4022,  0.5240, -0.6610, -0.2339],
        [-1.8503,  1.7839, -1.6806, -1.2367, -0.1450,  0.9305],
        [ 1.2150,  1.8190, -1.2247, -1.0801, -0.6217, -0.6316],
        [ 2.3189, -1.8660,  2.4554, -2.6724, -1.5291, -2.1327],
        [ 2.4152,  0.5679, -1.2700,  0.7764, -2.6427, -0.8106],
        [-3.2211, -2.5506, -1.8155,  0.8871,  2.1616,  1.8751],
        [-2.8878, -1.8751, -2.4092, -1.6493,  1.5872,  2.7970],
        [ 2.1404,  0.2808,  0.6665,  0.4902, -0.9887, -1.9308],
        [ 1.8278,  0.6963,  1.2534,  0.5134, -2.7036, -2.2246],
        [ 2.9666, -0.1894,  2.1132,  0.1674, -4.0095, -2.3640],
        [ 1.4443,  0.4927, -0.9149,  0.1907, -1.5028, -0.2057],
        [-5.5890, -1.1470, -1.9828,  1.3087,  4.6249,  3.0586],
        [-2.3935, -1.9228, -1.3419,  0.3247,  1.8605,  1.2661],
        [-1.2282, -2.6694, -0.5719,  1.7587,  1.1486,  1.3730],
        [ 1.1383, -1.4903,  1.5280,  1.4245,  0.2966,  1.0094],
        [ 1.7321, -1.0698,  1.2850,  0.6363, -1.8025,  2.2799],
        [-3.0940,  2.9804, -2.3579, -2.1252, -1.0342, -1.0916],
        [ 0.3345,  2.1726, -1.5284, -2.9579, -1.1116, -1.1185],
        [ 3.4396, -0.6837,  1.8352, -2.8090, -1.9835, -2.0118]],
       device='cuda:0')
action: tensor([[ 0.9929,  0.0827,  0.9899,  0.6627, -0.9811, -0.8740],
        [ 0.9935,  0.2816,  0.9815,  0.7606, -0.9765, -0.9379],
        [ 0.8320, -0.5921, -0.8411,  0.9670, -0.9443,  0.0881],
        [-0.9100, -0.4635, -0.9666,  0.9895,  0.9932,  0.9847],
        [-0.9903, -0.9683, -0.9576, -0.2150,  0.9324,  0.4112],
        [ 0.5522,  0.4220, -0.9401, -0.9313,  0.2875,  0.5908],
        [ 0.9574,  0.4732,  0.9986,  0.6916, -0.5840,  0.3987],
        [-0.9820,  0.1545, -0.8819,  0.5727,  0.0585,  0.7975],
        [-0.9781,  0.9270, -0.9223, -0.7434,  0.1968,  0.7826],
        [ 0.9918,  0.9544, -0.9830, -0.9601, -0.8659, -0.5799],
        [ 0.9967, -0.6065,  0.9919, -0.9721, -0.9673, -0.8569],
        [ 0.8683, -0.1158, -0.8555,  0.3239, -0.9683, -0.9815],
        [-0.9946, -0.9213, -0.8207,  0.5128,  0.8689,  0.7010],
        [-0.9384, -0.9859, -0.9502, -0.8140,  0.9809,  0.7616],
        [ 0.8497,  0.7976, -0.8338, -0.3780,  0.8435,  0.4460],
        [ 0.9983, -0.1582,  0.9932,  0.0922, -0.7510, -0.5158],
        [ 0.9906,  0.0550,  0.9760, -0.2378, -0.9840, -0.8679],
        [ 0.9178, -0.5511, -0.1327,  0.9693, -0.9666, -0.7788],
        [-0.9775, -0.9338, -0.9448,  0.4812,  0.9677,  0.2741],
        [-0.9722, -0.9903, -0.9422, -0.2975,  0.9442,  0.0373]],
       device='cuda:0')
squash tensor([[ 2.8197,  0.0829,  2.6423,  0.7977, -2.3273, -1.3497],
        [ 2.8607,  0.2894,  2.3373,  0.9976, -2.2166, -1.7206],
        [ 1.1945, -0.6808, -1.2249,  2.0440, -1.7759,  0.0883],
        [-1.5276, -0.5018, -2.0377,  2.6222,  2.8369,  2.4340],
        [-2.6638, -2.0651, -1.9160, -0.2184,  1.6767,  0.4371],
        [ 0.6215,  0.4501, -1.7387, -1.6683,  0.2958,  0.6788],
        [ 1.9137,  0.5142,  3.6488,  0.8511, -0.6686,  0.4221],
        [-2.3511,  0.1557, -1.3843,  0.6516,  0.0586,  1.0918],
        [-2.2521,  1.6369, -1.6045, -0.9580,  0.1994,  1.0519],
        [ 2.7457,  1.8792, -2.3798, -1.9477, -1.3163, -0.6624],
        [ 3.1965, -0.7034,  2.7551, -2.1293, -2.0493, -1.2816],
        [ 1.3263, -0.1163, -1.2764,  0.3360, -2.0638, -2.3382],
        [-2.9514, -1.5974, -1.1588,  0.5665,  1.3288,  0.8692],
        [-1.7241, -2.4727, -1.8343, -1.1387,  2.3218,  1.0000],
        [ 1.2549,  1.0919, -1.2005, -0.3978,  1.2331,  0.4797],
        [ 3.5446, -0.1596,  2.8422,  0.0925, -0.9752, -0.5706],
        [ 2.6755,  0.0551,  2.2053, -0.2424, -2.4086, -1.3245],
        [ 1.5747, -0.6200, -0.1335,  2.0807, -2.0378, -1.0423],
        [-2.2390, -1.6873, -1.7811,  0.5246,  2.0543,  0.2813],
        [-2.1313, -2.6595, -1.7576, -0.3067,  1.7758,  0.0373]],
       device='cuda:0')
action: tensor([[ 0.9944,  0.5266,  0.9948,  0.3279, -0.2005, -0.0034],
        [-0.9332, -0.6363, -0.5763,  0.3534,  0.2660,  0.2429],
        [-0.9716,  0.8261, -0.9467, -0.7129, -0.5791,  0.7349],
        [ 0.8073,  0.8408, -0.8723, -0.9568, -0.9102, -0.9562],
        [ 0.9413, -0.9666,  0.7772, -0.9759, -0.9352, -0.9530],
        [ 0.9463, -0.9509, -0.4581,  0.5545, -0.9816, -0.9119],
        [-0.9993, -0.6517, -0.9456,  0.7919,  0.9731,  0.7093],
        [-0.9833, -0.9915, -0.9646, -0.8956,  0.9842,  0.9952],
        [ 0.8606,  0.6467, -0.7188,  0.7954,  0.8127, -0.1067],
        [ 0.9963,  0.1557,  0.9947,  0.1014, -0.9465, -0.1992],
        [ 0.9784,  0.0011,  0.9859,  0.7649, -0.9855, -0.4021],
        [ 0.8824, -0.8344, -0.9771,  0.9756, -0.8886, -0.4454],
        [-0.9255, -0.9635, -0.9725,  0.9907,  0.9928,  0.6715],
        [-0.9688, -0.9892, -0.9307, -0.3794,  0.9297,  0.6423],
        [-0.0810,  0.9814, -0.9252, -0.8653, -0.5877,  0.3284],
        [ 0.9925,  0.9608,  0.9492,  0.4779, -0.7546,  0.1087],
        [ 0.9247,  0.5017,  0.9952,  0.7249, -0.3612, -0.1564],
        [ 0.9916,  0.7883,  0.5150, -0.4852, -0.9118, -0.9801],
        [ 0.9974, -0.1589, -0.4307,  0.6512, -0.6719, -0.8790],
        [-0.9932, -0.8651, -0.9791, -0.0654,  0.8355, -0.9671]],
       device='cuda:0')
squash tensor([[ 2.9416e+00,  5.8546e-01,  2.9722e+00,  3.4045e-01, -2.0325e-01,
         -3.4402e-03],
        [-1.6825e+00, -7.5193e-01, -6.5696e-01,  3.6937e-01,  2.7254e-01,
          2.4788e-01],
        [-2.1193e+00,  1.1756e+00, -1.7992e+00, -8.9297e-01, -6.6112e-01,
          9.3920e-01],
        [ 1.1193e+00,  1.2240e+00, -1.3427e+00, -1.9068e+00, -1.5289e+00,
         -1.8994e+00],
        [ 1.7491e+00, -2.0374e+00,  1.0383e+00, -2.2028e+00, -1.6981e+00,
         -1.8636e+00],
        [ 1.7952e+00, -1.8407e+00, -4.9496e-01,  6.2491e-01, -2.3393e+00,
         -1.5388e+00],
        [-3.9839e+00, -7.7820e-01, -1.7880e+00,  1.0764e+00,  2.1483e+00,
          8.8575e-01],
        [-2.3882e+00, -2.7266e+00, -2.0087e+00, -1.4493e+00,  2.4166e+00,
          3.0199e+00],
        [ 1.2955e+00,  7.6957e-01, -9.0517e-01,  1.0860e+00,  1.1348e+00,
         -1.0715e-01],
        [ 3.1515e+00,  1.5698e-01,  2.9684e+00,  1.0173e-01, -1.7971e+00,
         -2.0186e-01],
        [ 2.2588e+00,  1.1167e-03,  2.4746e+00,  1.0079e+00, -2.4605e+00,
         -4.2612e-01],
        [ 1.3864e+00, -1.2024e+00, -2.2289e+00,  2.1961e+00, -1.4153e+00,
         -4.7897e-01],
        [-1.6261e+00, -1.9927e+00, -2.1356e+00,  2.6806e+00,  2.8103e+00,
          8.1343e-01],
        [-2.0730e+00, -2.6089e+00, -1.6637e+00, -3.9940e-01,  1.6564e+00,
          7.6209e-01],
        [-8.1156e-02,  2.3347e+00, -1.6243e+00, -1.3142e+00, -6.7418e-01,
          3.4099e-01],
        [ 2.7885e+00,  1.9569e+00,  1.8232e+00,  5.2022e-01, -9.8365e-01,
          1.0913e-01],
        [ 1.6205e+00,  5.5159e-01,  3.0156e+00,  9.1789e-01, -3.7822e-01,
         -1.5771e-01],
        [ 2.7352e+00,  1.0668e+00,  5.6952e-01, -5.2975e-01, -1.5384e+00,
         -2.2998e+00],
        [ 3.3270e+00, -1.6031e-01, -4.6078e-01,  7.7746e-01, -8.1418e-01,
         -1.3712e+00],
        [-2.8430e+00, -1.3133e+00, -2.2751e+00, -6.5475e-02,  1.2060e+00,
         -2.0452e+00]], device='cuda:0')
action: tensor([[-0.9524, -0.9945, -0.7522,  0.5337,  0.9859, -0.6314],
        [-0.9319, -0.8931, -0.9342, -0.5898,  0.9406,  0.7694],
        [ 0.2512,  0.7831, -0.6632, -0.4818, -0.5616,  0.3115],
        [ 0.9559, -0.1516,  0.9782,  0.2213, -0.9693, -0.8544],
        [ 0.9829,  0.7068,  0.6950,  0.3294, -0.9990, -0.8160],
        [ 0.9889, -0.4521, -0.9695,  0.9513, -0.9500, -0.4331],
        [-0.9940, -0.9580, -0.9592,  0.9645,  0.9929,  0.9900],
        [-0.9677, -0.9849, -0.9843, -0.3342,  0.9434,  0.6397],
        [-0.0997, -0.0583, -0.9639, -0.2739,  0.8250,  0.4412],
        [ 0.9773,  0.4183,  0.9459,  0.7231, -0.1682,  0.3468],
        [ 0.8874, -0.6243,  0.9821,  0.7731, -0.8206, -0.1054],
        [ 0.9525, -0.7069,  0.0907,  0.9368, -0.7654, -0.7674],
        [ 0.6251, -0.8533, -0.6834,  0.9181, -0.9367, -0.9448],
        [-0.9664, -0.9954, -0.9758,  0.3362,  0.9810, -0.8885],
        [-0.9527, -0.9871, -0.9905, -0.9376,  0.9157,  0.6713],
        [ 0.7134,  0.9589, -0.9352, -0.8442, -0.6363, -0.8305],
        [ 0.9943,  0.2914,  0.9568,  0.5938, -0.6587, -0.7434],
        [ 0.9843,  0.4460,  0.9471,  0.1393, -0.9315, -0.6100],
        [ 0.9045,  0.8318, -0.0444,  0.3126, -0.9576, -0.9717],
        [-0.9951, -0.9591, -0.9427,  0.5242,  0.9716,  0.6400]],
       device='cuda:0')
squash tensor([[-1.8566, -2.9462, -0.9779,  0.5953,  2.4747, -0.7438],
        [-1.6725, -1.4369, -1.6902, -0.6773,  1.7435,  1.0189],
        [ 0.2567,  1.0533, -0.7985, -0.5253, -0.6351,  0.3222],
        [ 1.8963, -0.1528,  2.2545,  0.2250, -2.0802, -1.2721],
        [ 2.3776,  0.8808,  0.8576,  0.3421, -3.7798, -1.1446],
        [ 2.5956, -0.4874, -2.0846,  1.8457, -1.8315, -0.4638],
        [-2.9009, -1.9204, -1.9360,  2.0067,  2.8180,  2.6460],
        [-2.0552, -2.4402, -2.4212, -0.3476,  1.7678,  0.7577],
        [-0.1000, -0.0584, -1.9981, -0.2811,  1.1724,  0.4737],
        [ 2.2327,  0.4456,  1.7912,  0.9142, -0.1698,  0.3618],
        [ 1.4094, -0.7320,  2.3545,  1.0280, -1.1587, -0.1058],
        [ 1.8585, -0.8809,  0.0910,  1.7111, -1.0090, -1.0140],
        [ 0.7333, -1.2680, -0.8355,  1.5771, -1.7101, -1.7813],
        [-2.0354, -3.0330, -2.2003,  0.3498,  2.3233, -1.4146],
        [-1.8597, -2.5193, -2.6733, -1.7178,  1.5616,  0.8131],
        [ 0.8941,  1.9322, -1.6980, -1.2357, -0.7519, -1.1898],
        [ 2.9246,  0.3001,  1.9070,  0.6836, -0.7905, -0.9581],
        [ 2.4186,  0.4796,  1.8030,  0.1402, -1.6699, -0.7089],
        [ 1.4963,  1.1939, -0.0444,  0.3234, -1.9161, -2.1218],
        [-3.0039, -1.9350, -1.7616,  0.5821,  2.1204,  0.7581]],
       device='cuda:0')
action: tensor([[ 0.9874,  0.5584,  0.5773,  0.7856, -0.9562, -0.8758],
        [ 0.8284, -0.4480, -0.5386,  0.1060, -0.8635, -0.9383],
        [-0.9842, -0.9788, -0.9557,  0.4210,  0.9915,  0.5806],
        [-0.9585, -0.9820, -0.9782, -0.5669,  0.9436,  0.9215],
        [ 0.8715,  0.7091, -0.8853, -0.3610,  0.9456,  0.6205],
        [ 0.9453, -0.6058,  0.9465,  0.2091, -0.8356,  0.0949],
        [ 0.9843,  0.0126,  0.9998, -0.0630, -0.8583, -0.6066],
        [ 0.9962,  0.6991,  0.9500,  0.0091, -0.9754, -0.9347],
        [ 0.9469,  0.3151, -0.6349,  0.0746, -0.9744, -0.9453],
        [-0.9835, -0.9759, -0.9769,  0.1945,  0.9261, -0.1847],
        [-0.9770, -0.9950, -0.9578, -0.3955,  0.9600,  0.9626],
        [ 0.8905,  0.9431, -0.9946, -0.5101, -0.0282,  0.7358],
        [ 0.9831, -0.5540,  0.8837,  0.4824, -0.8550,  0.3814],
        [ 0.9885,  0.3490,  0.9695,  0.1620, -0.4639, -0.6708],
        [ 0.9511,  0.5869,  0.7840,  0.2103, -0.9393, -0.9867],
        [ 0.8586,  0.0167, -0.6955,  0.1793, -0.9141, -0.7405],
        [-0.9918, -0.9694, -0.9111,  0.5140,  0.8938,  0.0418],
        [-0.9898, -0.9990, -0.8200, -0.6693,  0.9876,  0.9267],
        [ 0.0356,  0.9648, -0.9862, -0.8806, -0.6728, -0.0952],
        [ 0.9932,  0.1583,  0.8661,  0.7248, -0.4004,  0.6931]],
       device='cuda:0')
squash tensor([[ 2.5321,  0.6305,  0.6584,  1.0597, -1.8999, -1.3575],
        [ 1.1830, -0.4822, -0.6023,  0.1064, -1.3071, -1.7240],
        [-2.4172, -2.2671, -1.8934,  0.4489,  2.7260,  0.6634],
        [-1.9267, -2.3504, -2.2539, -0.6430,  1.7700,  1.5989],
        [ 1.3391,  0.8854, -1.3998, -0.3780,  1.7881,  0.7258],
        [ 1.7855, -0.7023,  1.7974,  0.2122, -1.2066,  0.0952],
        [ 2.4191,  0.0126,  4.5985, -0.0631, -1.2868, -0.7035],
        [ 3.1320,  0.8655,  1.8317,  0.0091, -2.1933, -1.6940],
        [ 1.8010,  0.3262, -0.7495,  0.0748, -2.1736, -1.7857],
        [-2.3934, -2.2034, -2.2239,  0.1970,  1.6302, -0.1868],
        [-2.2280, -2.9949, -1.9181, -0.4183,  1.9462,  1.9802],
        [ 1.4243,  1.7653, -2.9546, -0.5629, -0.0283,  0.9413],
        [ 2.3820, -0.6241,  1.3926,  0.5261, -1.2743,  0.4017],
        [ 2.5774,  0.3644,  2.0834,  0.1634, -0.5023, -0.8122],
        [ 1.8427,  0.6729,  1.0556,  0.2135, -1.7324, -2.5051],
        [ 1.2881,  0.0167, -0.8585,  0.1813, -1.5517, -0.9517],
        [-2.7476, -2.0818, -1.5341,  0.5682,  1.4404,  0.0418],
        [-2.6343, -3.7970, -1.1567, -0.8094,  2.5388,  1.6342],
        [ 0.0356,  2.0117, -2.4856, -1.3784, -0.8158, -0.0954],
        [ 2.8408,  0.1597,  1.3173,  0.9177, -0.4241,  0.8539]],
       device='cuda:0')
action: tensor([[-0.9332, -0.9776, -0.9621, -0.4937,  0.9821,  0.7306],
        [ 0.7389, -0.2139, -0.3299,  0.1996,  0.3965,  0.5729],
        [ 0.9930,  0.2698,  0.9907,  0.5784, -0.3424, -0.7092],
        [ 0.9351, -0.1234,  0.9867, -0.4875, -0.9349, -0.8992],
        [ 0.9904,  0.4737,  0.9997, -0.2713, -0.9250, -0.6588],
        [ 0.9874,  0.4173, -0.9825,  0.6514, -0.8329, -0.8338],
        [-0.9923, -0.9752, -0.9325, -0.2259,  0.9897,  0.9596],
        [-0.9942, -0.9844, -0.9863, -0.6330,  0.9915,  0.8490],
        [ 0.7823, -0.5058, -0.2421,  0.3759,  0.9627,  0.8112],
        [ 0.8623,  0.2190,  0.9347,  0.3305, -0.1851,  0.3049],
        [-0.9126, -0.3856, -0.3753,  0.5665, -0.9122,  0.6493],
        [-0.9631,  0.8831, -0.9629, -0.8716, -0.4555,  0.6618],
        [ 0.9149,  0.7666, -0.8908, -0.8613, -0.3895, -0.7360],
        [ 0.9977, -0.8443,  0.8588, -0.9938, -0.9520, -0.7904],
        [ 0.9129,  0.4531, -0.9765,  0.5089, -0.9864, -0.9597],
        [-0.9974, -0.9809, -0.9793,  0.7911,  0.9876,  0.9817],
        [-0.9895, -0.9902, -0.9576, -0.9473,  0.9659,  0.9833],
        [ 0.4810,  0.7912, -0.9695,  0.1920,  0.5590,  0.4459],
        [ 0.9938, -0.0526,  0.9980,  0.7798, -0.8666, -0.8679],
        [ 0.9911,  0.2804,  0.8802, -0.1061, -0.9741, -0.9200]],
       device='cuda:0')
squash tensor([[-1.6825, -2.2402, -1.9738, -0.5410,  2.3545,  0.9301],
        [ 0.9480, -0.2173, -0.3428,  0.2023,  0.4195,  0.6518],
        [ 2.8272,  0.2767,  2.6853,  0.6601, -0.3568, -0.8857],
        [ 1.6976, -0.1241,  2.5041, -0.5327, -1.6961, -1.4679],
        [ 2.6680,  0.5148,  4.4665, -0.2783, -1.6226, -0.7906],
        [ 2.5305,  0.4444, -2.3645,  0.7777, -1.1974, -1.2006],
        [-2.7751, -2.1889, -1.6770, -0.2299,  2.6297,  1.9414],
        [-2.9169, -2.4227, -2.4871, -0.7464,  2.7274,  1.2527],
        [ 1.0512, -0.5571, -0.2470,  0.3953,  1.9817,  1.1304],
        [ 1.3024,  0.2226,  1.6943,  0.3434, -0.1873,  0.3149],
        [-1.5431, -0.4067, -0.3946,  0.6423, -1.5403,  0.7740],
        [-1.9871,  1.3899, -1.9838, -1.3397, -0.4916,  0.7960],
        [ 1.5570,  1.0120, -1.4257, -1.2983, -0.4112, -0.9417],
        [ 3.3739, -1.2360,  1.2887, -2.8831, -1.8523, -1.0726],
        [ 1.5445,  0.4886, -2.2151,  0.5612, -2.4931, -1.9419],
        [-3.3279, -2.3216, -2.2803,  1.0745,  2.5367,  2.3414],
        [-2.6227, -2.6576, -1.9162, -1.8052,  2.0276,  2.3874],
        [ 0.5243,  1.0746, -2.0844,  0.1945,  0.6314,  0.4795],
        [ 2.8840, -0.0527,  3.4449,  1.0449, -1.3194, -1.3246],
        [ 2.7025,  0.2881,  1.3765, -0.1065, -2.1676, -1.5891]],
       device='cuda:0')
action: tensor([[ 0.9549, -0.6305,  0.9891,  0.4210, -0.8091, -0.2373],
        [ 0.9901, -0.0322,  0.9994, -0.5019, -0.8574,  0.6160],
        [ 0.9994,  0.1998,  0.8371,  0.3342, -0.9789, -0.7794],
        [ 0.9861,  0.2963, -0.8200,  0.2839, -0.9450, -0.8266],
        [-0.9727, -0.9596, -0.7919, -0.0420,  0.9151, -0.7985],
        [-0.9654, -0.9466, -0.8721, -0.5847,  0.9669,  0.9298],
        [ 0.7478, -0.1017,  0.0386, -0.1591,  0.4229,  0.2168],
        [ 0.9168,  0.5963,  0.9724,  0.5881, -0.8839, -0.8421],
        [ 0.9928,  0.7664,  0.9571,  0.4566, -0.9942, -0.3056],
        [ 0.9616,  0.3680, -0.9887,  0.9495, -0.9384,  0.8816],
        [-0.9797, -0.9262, -0.9849,  0.9654,  0.9875,  0.9359],
        [-0.9289, -0.9145, -0.9756,  0.0420,  0.9287,  0.8947],
        [ 0.9046,  0.3345, -0.9096,  0.4680,  0.7822,  0.3550],
        [ 0.9518, -0.5063,  0.9722,  0.3906, -0.6215,  0.6893],
        [-0.3165,  0.0999,  0.3130,  0.4180, -0.7347, -0.0125],
        [-0.9380,  0.9766, -0.8213, -0.4096, -0.1715,  0.9266],
        [ 0.9142,  0.8549, -0.9104, -0.9288, -0.7676, -0.7449],
        [ 0.9763, -0.9908,  0.7981, -0.9448, -0.8068, -0.9489],
        [ 0.9985, -0.8042, -0.6706,  0.8493, -0.9872, -0.9793],
        [-0.9802, -0.3384, -0.9939,  0.3579,  0.9434,  0.8319]],
       device='cuda:0')
squash tensor([[ 1.8846, -0.7423,  2.6043,  0.4489, -1.1243, -0.2419],
        [ 2.6526, -0.0322,  4.0795, -0.5519, -1.2836,  0.7186],
        [ 4.0658,  0.2025,  1.2115,  0.3476, -2.2714, -1.0440],
        [ 2.4817,  0.3054, -1.1568,  0.2920, -1.7831, -1.1775],
        [-2.1402, -1.9407, -1.0764, -0.0420,  1.5583, -1.0943],
        [-2.0202, -1.7984, -1.3419, -0.6695,  2.0430,  1.6570],
        [ 0.9679, -0.1020,  0.0386, -0.1604,  0.4512,  0.2203],
        [ 1.5685,  0.6874,  2.1352,  0.6748, -1.3933, -1.2283],
        [ 2.8133,  1.0115,  1.9108,  0.4930, -2.9190, -0.3157],
        [ 1.9665,  0.3861, -2.5832,  1.8266, -1.7243,  1.3827],
        [-2.2910, -1.6310, -2.4385,  2.0191,  2.5332,  1.7042],
        [-1.6506, -1.5546, -2.1977,  0.0420,  1.6488,  1.4451],
        [ 1.4968,  0.3478, -1.5254,  0.5075,  1.0511,  0.3711],
        [ 1.8508, -0.5578,  2.1312,  0.4125, -0.7274,  0.8466],
        [-0.3277,  0.1003,  0.3238,  0.4452, -0.9388, -0.0125],
        [-1.7214,  2.2171, -1.1607, -0.4351, -0.1732,  1.6338],
        [ 1.5523,  1.2739, -1.5300, -1.6494, -1.0145, -0.9614],
        [ 2.2125, -2.6891,  1.0935, -1.7814, -1.1178, -1.8206],
        [ 3.6064, -1.1105, -0.8118,  1.2536, -2.5216, -2.2811],
        [-2.3033, -0.3523, -2.8936,  0.3745,  1.7679,  1.1944]],
       device='cuda:0')
action: tensor([[ 0.8494,  0.8236, -0.9206, -0.9324,  0.5757, -0.1656],
        [ 0.9610,  0.5961,  0.9916,  0.7872, -0.4193,  0.6812],
        [-0.9879,  0.8774, -0.9051, -0.1646, -0.0986, -0.1116],
        [ 0.9059,  0.9689, -0.9813, -0.8697,  0.0872,  0.2029],
        [ 0.9306, -0.7944,  0.9869, -0.9628, -0.8276, -0.9613],
        [ 0.8560,  0.7226, -0.5785,  0.2472, -0.9121, -0.7294],
        [-0.8931, -0.7549, -0.9813,  0.6333,  0.9469,  0.8073],
        [-0.9241, -0.9822, -0.9340, -0.6944,  0.9818,  0.7467],
        [ 0.7395, -0.0281,  0.4506,  0.9508,  0.8520,  0.8323],
        [ 0.8881,  0.5434,  0.9711,  0.4046, -0.9936, -0.8730],
        [ 0.9961,  0.7068,  0.9909,  0.9619, -0.9718, -0.8700],
        [ 0.9248, -0.5640, -0.5695,  0.9786, -0.9367, -0.5845],
        [-0.9626, -0.9787, -0.9850,  0.9989,  0.9665,  0.8760],
        [-0.9158, -0.9538, -0.9005,  0.6755,  0.9815,  0.6958],
        [ 0.0716,  0.3309, -0.9442, -0.9699, -0.1285, -0.1632],
        [ 0.9958,  0.9737,  0.9767, -0.1924, -0.6459, -0.2390],
        [-0.8476, -0.3517, -0.6203,  0.7900,  0.9379, -0.1508],
        [-0.9472,  0.7880, -0.9795, -0.8108,  0.3521,  0.7453],
        [ 0.9832,  0.9965, -0.9803, -0.9841, -0.9462, -0.7225],
        [ 0.9957, -0.1378,  0.9838, -0.9892, -0.7836, -0.8883]],
       device='cuda:0')
squash tensor([[ 1.2540,  1.1679, -1.5930, -1.6767,  0.6560, -0.1671],
        [ 1.9582,  0.6871,  2.7316,  1.0639, -0.4468,  0.8313],
        [-2.5498,  1.3643, -1.4995, -0.1661, -0.0989, -0.1121],
        [ 1.5041,  2.0748, -2.3328, -1.3319,  0.0875,  0.2058],
        [ 1.6632, -1.0832,  2.5112, -1.9833, -1.1803, -1.9628],
        [ 1.2781,  0.9130, -0.6603,  0.2524, -1.5399, -0.9275],
        [-1.4372, -0.9842, -2.3318,  0.7469,  1.8014,  1.1192],
        [-1.6161, -2.3567, -1.6888, -0.8563,  2.3452,  0.9655],
        [ 0.9494, -0.0281,  0.4854,  1.8400,  1.2634,  1.1957],
        [ 1.4130,  0.6090,  2.1104,  0.4291, -2.8714, -1.3456],
        [ 3.1143,  0.8807,  2.6956,  1.9712, -2.1235, -1.3329],
        [ 1.6215, -0.6387, -0.6467,  2.2631, -1.7107, -0.6693],
        [-1.9800, -2.2669, -2.4436,  3.7510,  2.0363,  1.3584],
        [-1.5621, -1.8723, -1.4748,  0.8207,  2.3359,  0.8590],
        [ 0.0718,  0.3438, -1.7758, -2.0904, -0.1292, -0.1647],
        [ 3.0870,  2.1589,  2.2210, -0.1948, -0.7683, -0.2437],
        [-1.2476, -0.3673, -0.7255,  1.0714,  1.7206, -0.1519],
        [-1.8038,  1.0661, -2.2857, -1.1292,  0.3679,  0.9622],
        [ 2.3868,  3.1718, -2.3059, -2.4118, -1.7941, -0.9129],
        [ 3.0701, -0.1387,  2.4046, -2.6058, -1.0547, -1.4140]],
       device='cuda:0')
action: tensor([[-0.9573, -0.9721, -0.7003, -0.1970,  0.9874,  0.9799],
        [ 0.8575,  0.8736, -0.9859, -0.4963, -0.3369,  0.6589],
        [ 0.8339,  0.7806,  0.9244,  0.1163, -0.9745, -0.2165],
        [-0.9205,  0.8027, -0.9749,  0.1517,  0.3327,  0.7805],
        [-0.5570,  0.7463, -0.7395, -0.8750, -0.8060, -0.6887],
        [ 0.5508,  0.8422, -0.9290, -0.7299,  0.1329, -0.5220],
        [ 0.9927, -0.7181,  0.9474, -0.9352, -0.8628, -0.9619],
        [ 0.9634, -0.1751, -0.7185,  0.8500, -0.9185, -0.8054],
        [-0.9972, -0.9957, -0.9572,  0.9868,  0.9840,  0.9175],
        [-0.9748, -0.9882, -0.9518, -0.3385,  0.9864,  0.9841],
        [ 0.7871,  0.4918, -0.5247,  0.9121,  0.2535,  0.2131],
        [ 0.9646,  0.1655,  0.9741,  0.5498, -0.9895, -0.8022],
        [ 0.9256, -0.0800,  0.7278,  0.9426, -0.9238, -0.8868],
        [-0.2859, -0.5782, -0.6398,  0.9817, -0.7016,  0.2192],
        [-0.9651, -0.9892, -0.9951,  0.9881,  0.8023,  0.2335],
        [-0.9536, -0.9249, -0.9281, -0.1067,  0.9426,  0.8413],
        [ 0.0446,  0.9212, -0.9713, -0.8844,  0.4313, -0.5393],
        [ 0.9953,  0.1759,  0.9762,  0.4285, -0.9078,  0.2372],
        [ 0.9567, -0.1776,  0.9145,  0.8670, -0.8594, -0.7368],
        [ 0.9538, -0.6704, -0.8161,  0.9492, -0.9620, -0.2660]],
       device='cuda:0')
squash tensor([[-1.9124, -2.1293, -0.8679, -0.1996,  2.5285,  2.2948],
        [ 1.2837,  1.3480, -2.4746, -0.5444, -0.3506,  0.7909],
        [ 1.2009,  1.0469,  1.6187,  0.1168, -2.1743, -0.2200],
        [-1.5922,  1.1061, -2.1824,  0.1528,  0.3458,  1.0467],
        [-0.6285,  0.9645, -0.9493, -1.3540, -1.1155, -0.8456],
        [ 0.6196,  1.2286, -1.6513, -0.9285,  0.1337, -0.5791],
        [ 2.8079, -0.9037,  1.8056, -1.6981, -1.3043, -1.9704],
        [ 1.9906, -0.1769, -0.9045,  1.2561, -1.5796, -1.1139],
        [-3.2796, -3.0743, -1.9120,  2.5051,  2.4092,  1.5732],
        [-2.1813, -2.5645, -1.8511, -0.3524,  2.4937,  2.4132],
        [ 1.0637,  0.5385, -0.5828,  1.5398,  0.2591,  0.2164],
        [ 2.0077,  0.1670,  2.1665,  0.6181, -2.6213, -1.1046],
        [ 1.6268, -0.0802,  0.9241,  1.7612, -1.6141, -1.4069],
        [-0.2941, -0.6597, -0.7579,  2.3427, -0.8704,  0.2228],
        [-2.0161, -2.6082, -3.0020,  2.5610,  1.1050,  0.2379],
        [-1.8696, -1.6222, -1.6442, -0.1071,  1.7611,  1.2255],
        [ 0.0446,  1.5966, -2.1156, -1.3956,  0.4615, -0.6032],
        [ 3.0266,  0.1778,  2.2103,  0.4580, -1.5149,  0.2418],
        [ 1.9049, -0.1795,  1.5544,  1.3210, -1.2912, -0.9435],
        [ 1.8719, -0.8115, -1.1450,  1.8240, -1.9714, -0.2725]],
       device='cuda:0')
action: tensor([[ 0.7550, -0.4002,  0.9907,  0.4916, -0.8542,  0.5469],
        [ 0.9960,  0.4730,  0.9425, -0.3415, -0.9602, -0.0872],
        [ 0.9324, -0.0191,  0.3697,  0.7786, -0.9472, -0.5761],
        [-0.3553, -0.3797, -0.7915,  0.4369,  0.2559,  0.5753],
        [-0.5626, -0.9925, -0.9659, -0.1551,  0.9753,  0.7655],
        [-0.8592, -0.4489, -0.2387,  0.4759,  0.8982,  0.6082],
        [ 0.9782,  0.7419,  0.9742,  0.7323, -0.3910, -0.5233],
        [ 0.9695, -0.7095,  0.9984,  0.8853, -0.8878,  0.3931],
        [ 0.2710, -0.8949, -0.4065,  0.9780, -0.8353,  0.5568],
        [-0.9272, -0.9624, -0.9456,  0.9658,  0.8154,  0.9236],
        [-0.9856, -0.9611, -0.8825,  0.3291,  0.9926,  0.9453],
        [ 0.6412,  0.9637, -0.8369, -0.7571, -0.1837, -0.5192],
        [ 0.9664,  0.3362,  0.9878,  0.6777, -0.3653, -0.7608],
        [-0.9755,  0.7542, -0.8212,  0.0587, -0.2973, -0.6461],
        [ 0.6985,  0.8769, -0.9533, -0.9126, -0.6199, -0.3230],
        [ 0.9857, -0.9293,  0.9890, -0.9939, -0.9555, -0.6919],
        [ 0.9968, -0.4747, -0.9690,  0.0450, -0.9957, -0.8553],
        [-0.9948, -0.8656, -0.9031,  0.6088,  0.9530,  0.7949],
        [-0.9910, -0.9979, -0.8850, -0.6340,  0.9621,  0.9345],
        [ 0.9731,  0.0879, -0.2170,  0.7532,  0.9431,  0.6070]],
       device='cuda:0')
squash tensor([[ 0.9845, -0.4239,  2.6831,  0.5382, -1.2715,  0.6140],
        [ 3.1004,  0.5139,  1.7596, -0.3558, -1.9488, -0.0874],
        [ 1.6767, -0.0191,  0.3881,  1.0418, -1.8042, -0.6567],
        [-0.3714, -0.3998, -1.0755,  0.4684,  0.2618,  0.6553],
        [-0.6366, -2.7942, -2.0276, -0.1563,  2.1908,  1.0093],
        [-1.2902, -0.4833, -0.2434,  0.5177,  1.4630,  0.7060],
        [ 2.2540,  0.9546,  2.1686,  0.9338, -0.4129, -0.5809],
        [ 2.0831, -0.8861,  3.5604,  1.3999, -1.4113,  0.4155],
        [ 0.2779, -1.4460, -0.4314,  2.2490, -1.2053,  0.6282],
        [-1.6383, -1.9775, -1.7881,  2.0255,  1.1429,  1.6129],
        [-2.4633, -1.9596, -1.3871,  0.3418,  2.7983,  1.7861],
        [ 0.7602,  1.9954, -1.2109, -0.9895, -0.1859, -0.5753],
        [ 2.0349,  0.3499,  2.5464,  0.8248, -0.3830, -0.9980],
        [-2.1956,  0.9827, -1.1606,  0.0588, -0.3066, -0.7686],
        [ 0.8643,  1.3622, -1.8667, -1.5428, -0.7249, -0.3350],
        [ 2.4672, -1.6533,  2.5975, -2.8960, -1.8911, -0.8516],
        [ 3.2206, -0.5161, -2.0759,  0.0450, -3.0714, -1.2755],
        [-2.9781, -1.3152, -1.4886,  0.7070,  1.8640,  1.0846],
        [-2.7020, -3.4227, -1.3982, -0.7481,  1.9736,  1.6929],
        [ 2.1474,  0.0881, -0.2205,  0.9802,  1.7651,  0.7042]],
       device='cuda:0')
action: tensor([[ 0.9135, -0.3215, -0.9645,  0.9811, -0.9837,  0.0270],
        [-0.9679, -0.9504, -0.9401,  0.9948,  0.9819,  0.9568],
        [-0.9296, -0.9449, -0.9915, -0.3172,  0.8258,  0.6095],
        [ 0.4865,  0.8303, -0.9662, -0.9846, -0.7881,  0.9721],
        [ 0.9890,  0.3726,  0.9833,  0.7171, -0.4761, -0.4109],
        [-0.8228,  0.3062, -0.7239,  0.2009,  0.4226, -0.3556],
        [-0.9529,  0.9511, -0.9255, -0.8645, -0.7874,  0.8978],
        [ 0.9854,  0.9202, -0.6688, -0.9629, -0.7685, -0.9353],
        [ 0.9984, -0.6782,  0.9828, -0.9924, -0.9184, -0.9569],
        [ 0.9702,  0.5470, -0.8864,  0.7395, -0.9314, -0.9720],
        [-0.9905, -0.9827, -0.9765,  0.6320,  0.9775,  0.6342],
        [-0.9770, -0.9465, -0.7952, -0.8991,  0.9321,  0.9946],
        [ 0.6027,  0.3436, -0.7966,  0.5560,  0.5997,  0.2423],
        [ 0.9017,  0.4966,  0.9848,  0.5837, -0.9423, -0.9690],
        [ 0.9620,  0.3012,  0.9809,  0.3470, -0.9793, -0.8658],
        [ 0.9938,  0.4379, -0.7858,  0.8458, -0.9720, -0.0302],
        [-0.9854, -0.9570, -0.9162,  0.8254,  0.9680,  0.8605],
        [-0.9882, -0.9818, -0.7777,  0.1168,  0.9650,  0.9891],
        [ 0.7323, -0.0830, -0.8339, -0.3108,  0.2208,  0.3848],
        [ 0.9775,  0.5395,  0.9951,  0.8463,  0.3070,  0.8796]],
       device='cuda:0')
squash 