/home/miao/Research/rl-starter-files/scripts/train.py --algo ppo --env MiniGrid-DoorKey-5x5-v0 --model DoorKey --save-interval 10 --frames 80000

Namespace(algo='ppo', batch_size=256, clip_eps=0.2, discount=0.99, entropy_coef=0.01, env='MiniGrid-DoorKey-5x5-v0', epochs=4, frames=80000, frames_per_proc=None, gae_lambda=0.95, log_interval=1, lr=0.001, max_grad_norm=0.5, mem=False, model='DoorKey', optim_alpha=0.99, optim_eps=1e-08, procs=16, recurrence=1, save_interval=10, seed=1, text=False, value_loss_coef=0.5)

Device: cpu

Environments loaded

Training status loaded

Observations preprocessor loaded
Model loaded

ACModel(
  (image_conv): Sequential(
    (0): Conv2d(3, 16, kernel_size=(2, 2), stride=(1, 1))
    (1): ReLU()
    (2): MaxPool2d(kernel_size=(2, 2), stride=(2, 2), padding=0, dilation=1, ceil_mode=False)
    (3): Conv2d(16, 32, kernel_size=(2, 2), stride=(1, 1))
    (4): ReLU()
    (5): Conv2d(32, 64, kernel_size=(2, 2), stride=(1, 1))
    (6): ReLU()
  )
  (actor): Sequential(
    (0): Linear(in_features=64, out_features=64, bias=True)
    (1): Tanh()
    (2): Linear(in_features=64, out_features=7, bias=True)
  )
  (critic): Sequential(
    (0): Linear(in_features=64, out_features=64, bias=True)
    (1): Tanh()
    (2): Linear(in_features=64, out_features=1, bias=True)
  )
)

Optimizer loaded

U 1 | F 002048 | FPS 4490 | D 0 | rR:μσmM 0.00 0.00 0.00 0.00 | F:μσmM 0.0 0.0 0 0 | H 1.918 | V -0.099 | pL -0.015 | vL 0.001 | ∇ 0.040
U 2 | F 004096 | FPS 4265 | D 0 | rR:μσmM 0.06 0.13 0.00 0.51 | F:μσmM 239.8 27.9 137.0 250.0 | H 1.933 | V -0.066 | pL -0.031 | vL 0.002 | ∇ 0.021
U 3 | F 006144 | FPS 4347 | D 1 | rR:μσmM 0.04 0.10 0.00 0.33 | F:μσmM 242.9 17.0 186.0 250.0 | H 1.931 | V -0.056 | pL -0.014 | vL 0.001 | ∇ 0.011
U 4 | F 008192 | FPS 4378 | D 1 | rR:μσmM 0.02 0.08 0.00 0.33 | F:μσmM 246.0 15.5 186.0 250.0 | H 1.939 | V -0.046 | pL -0.016 | vL 0.000 | ∇ 0.006
U 5 | F 010240 | FPS 4248 | D 2 | rR:μσmM 0.00 0.00 0.00 0.00 | F:μσmM 250.0 0.0 250.0 250.0 | H 1.943 | V -0.041 | pL -0.008 | vL 0.000 | ∇ 0.004
U 6 | F 012288 | FPS 4400 | D 2 | rR:μσmM 0.03 0.10 0.00 0.42 | F:μσmM 244.4 21.8 160.0 250.0 | H 1.943 | V -0.028 | pL -0.013 | vL 0.001 | ∇ 0.009
U 7 | F 014336 | FPS 4273 | D 3 | rR:μσmM 0.03 0.10 0.00 0.42 | F:μσmM 244.4 21.8 160.0 250.0 | H 1.943 | V -0.022 | pL -0.004 | vL 0.000 | ∇ 0.004
U 8 | F 016384 | FPS 4340 | D 3 | rR:μσmM 0.04 0.10 0.00 0.31 | F:μσmM 242.9 17.1 191.0 250.0 | H 1.941 | V -0.011 | pL -0.011 | vL 0.000 | ∇ 0.008
U 9 | F 018432 | FPS 4315 | D 4 | rR:μσmM 0.04 0.10 0.00 0.31 | F:μσmM 242.9 17.1 191.0 250.0 | H 1.944 | V -0.007 | pL -0.004 | vL 0.000 | ∇ 0.005
U 10 | F 020480 | FPS 4076 | D 4 | rR:μσmM 0.02 0.08 0.00 0.32 | F:μσmM 246.1 15.0 188.0 250.0 | H 1.942 | V -0.001 | pL -0.003 | vL 0.000 | ∇ 0.006
Status saved
U 11 | F 022528 | FPS 4350 | D 5 | rR:μσmM 0.06 0.17 0.00 0.58 | F:μσmM 236.3 37.2 117.0 250.0 | H 1.935 | V 0.011 | pL -0.009 | vL 0.002 | ∇ 0.031
U 12 | F 024576 | FPS 4248 | D 5 | rR:μσmM 0.09 0.18 0.00 0.58 | F:μσmM 231.0 40.7 117.0 250.0 | H 1.936 | V 0.009 | pL -0.003 | vL 0.001 | ∇ 0.019
U 13 | F 026624 | FPS 4258 | D 6 | rR:μσmM 0.15 0.23 0.00 0.62 | F:μσmM 217.2 50.1 106.0 250.0 | H 1.922 | V 0.022 | pL -0.017 | vL 0.002 | ∇ 0.037
U 14 | F 028672 | FPS 4301 | D 6 | rR:μσmM 0.16 0.27 0.00 0.80 | F:μσmM 213.4 65.0 56.0 250.0 | H 1.924 | V 0.022 | pL -0.007 | vL 0.003 | ∇ 0.034
U 15 | F 030720 | FPS 4265 | D 7 | rR:μσmM 0.27 0.30 0.00 0.77 | F:μσmM 188.1 71.5 63.0 250.0 | H 1.897 | V 0.074 | pL -0.017 | vL 0.005 | ∇ 0.028
U 16 | F 032768 | FPS 4410 | D 7 | rR:μσmM 0.33 0.32 0.00 0.85 | F:μσmM 176.8 78.3 42.0 250.0 | H 1.906 | V 0.074 | pL -0.012 | vL 0.005 | ∇ 0.041
U 17 | F 034816 | FPS 4201 | D 8 | rR:μσmM 0.25 0.23 0.00 0.66 | F:μσmM 197.6 53.2 94.0 250.0 | H 1.903 | V 0.115 | pL -0.003 | vL 0.004 | ∇ 0.029
U 18 | F 036864 | FPS 4294 | D 8 | rR:μσmM 0.34 0.23 0.00 0.73 | F:μσmM 178.7 56.2 75.0 250.0 | H 1.866 | V 0.144 | pL -0.008 | vL 0.005 | ∇ 0.042
U 19 | F 038912 | FPS 4267 | D 9 | rR:μσmM 0.55 0.28 0.00 0.90 | F:μσmM 122.1 72.4 28.0 250.0 | H 1.825 | V 0.177 | pL -0.042 | vL 0.008 | ∇ 0.057
U 20 | F 040960 | FPS 4276 | D 9 | rR:μσmM 0.53 0.28 0.00 0.94 | F:μσmM 128.6 72.5 18.0 250.0 | H 1.803 | V 0.221 | pL -0.036 | vL 0.010 | ∇ 0.056
Status saved
U 21 | F 043008 | FPS 4411 | D 10 | rR:μσmM 0.74 0.12 0.46 0.92 | F:μσmM 71.2 34.5 21.0 149.0 | H 1.794 | V 0.301 | pL -0.068 | vL 0.013 | ∇ 0.073
U 22 | F 045056 | FPS 4269 | D 10 | rR:μσmM 0.79 0.18 0.00 0.95 | F:μσmM 58.7 45.4 15.0 250.0 | H 1.692 | V 0.424 | pL -0.091 | vL 0.016 | ∇ 0.101
U 23 | F 047104 | FPS 4217 | D 11 | rR:μσmM 0.80 0.14 0.25 0.95 | F:μσmM 55.2 37.7 13.0 208.0 | H 1.634 | V 0.492 | pL -0.075 | vL 0.014 | ∇ 0.112
U 24 | F 049152 | FPS 4313 | D 11 | rR:μσmM 0.85 0.10 0.52 0.96 | F:μσmM 40.3 26.9 11.0 134.0 | H 1.527 | V 0.565 | pL -0.075 | vL 0.012 | ∇ 0.109
U 25 | F 051200 | FPS 4226 | D 11 | rR:μσmM 0.88 0.12 0.00 0.97 | F:μσmM 33.7 30.9 8.0 250.0 | H 1.447 | V 0.659 | pL -0.093 | vL 0.009 | ∇ 0.123
U 26 | F 053248 | FPS 4266 | D 12 | rR:μσmM 0.90 0.05 0.70 0.96 | F:μσmM 27.4 14.4 10.0 82.0 | H 1.401 | V 0.714 | pL -0.066 | vL 0.005 | ∇ 0.087
U 27 | F 055296 | FPS 4239 | D 12 | rR:μσmM 0.91 0.04 0.75 0.97 | F:μσmM 23.6 11.8 9.0 69.0 | H 1.331 | V 0.772 | pL -0.052 | vL 0.004 | ∇ 0.100
U 28 | F 057344 | FPS 4124 | D 13 | rR:μσmM 0.93 0.03 0.84 0.97 | F:μσmM 20.1 7.7 9.0 44.0 | H 1.257 | V 0.805 | pL -0.048 | vL 0.002 | ∇ 0.061
U 29 | F 059392 | FPS 3965 | D 13 | rR:μσmM 0.93 0.02 0.84 0.97 | F:μσmM 18.1 6.9 8.0 44.0 | H 1.204 | V 0.828 | pL -0.027 | vL 0.002 | ∇ 0.052
U 30 | F 061440 | FPS 4103 | D 14 | rR:μσmM 0.93 0.03 0.85 0.97 | F:μσmM 18.1 7.4 7.0 41.0 | H 1.236 | V 0.839 | pL -0.017 | vL 0.001 | ∇ 0.033
Status saved
U 31 | F 063488 | FPS 4121 | D 14 | rR:μσmM 0.93 0.03 0.86 0.97 | F:μσmM 18.6 7.0 8.0 39.0 | H 1.283 | V 0.838 | pL -0.007 | vL 0.001 | ∇ 0.038
U 32 | F 065536 | FPS 4226 | D 15 | rR:μσmM 0.93 0.03 0.83 0.97 | F:μσmM 19.3 8.0 8.0 48.0 | H 1.293 | V 0.835 | pL 0.005 | vL 0.001 | ∇ 0.029
U 33 | F 067584 | FPS 4227 | D 15 | rR:μσmM 0.93 0.02 0.86 0.97 | F:μσmM 18.1 6.3 9.0 38.0 | H 1.290 | V 0.840 | pL -0.009 | vL 0.001 | ∇ 0.025
U 34 | F 069632 | FPS 4167 | D 16 | rR:μσmM 0.93 0.03 0.83 0.96 | F:μσmM 19.0 7.2 10.0 48.0 | H 1.336 | V 0.838 | pL 0.004 | vL 0.001 | ∇ 0.027
U 35 | F 071680 | FPS 4234 | D 16 | rR:μσmM 0.93 0.03 0.84 0.96 | F:μσmM 20.1 7.2 10.0 44.0 | H 1.311 | V 0.832 | pL 0.006 | vL 0.001 | ∇ 0.033
U 36 | F 073728 | FPS 4003 | D 17 | rR:μσmM 0.93 0.03 0.85 0.97 | F:μσmM 19.9 7.1 8.0 41.0 | H 1.371 | V 0.835 | pL 0.002 | vL 0.001 | ∇ 0.036
U 37 | F 075776 | FPS 4151 | D 17 | rR:μσmM 0.93 0.03 0.85 0.97 | F:μσmM 19.5 7.3 9.0 42.0 | H 1.402 | V 0.837 | pL 0.014 | vL 0.002 | ∇ 0.038
U 38 | F 077824 | FPS 4192 | D 18 | rR:μσmM 0.92 0.03 0.80 0.97 | F:μσmM 21.3 8.6 9.0 55.0 | H 1.451 | V 0.806 | pL 0.022 | vL 0.002 | ∇ 0.049
U 39 | F 079872 | FPS 4089 | D 18 | rR:μσmM 0.91 0.08 0.24 0.96 | F:μσmM 24.8 22.5 10.0 212.0 | H 1.410 | V 0.804 | pL 0.008 | vL 0.003 | ∇ 0.059
U 40 | F 081920 | FPS 4085 | D 19 | rR:μσmM 0.92 0.03 0.84 0.97 | F:μσmM 22.0 7.4 8.0 44.0 | H 1.364 | V 0.814 | pL -0.009 | vL 0.001 | ∇ 0.034
Status saved
